{"global_step": 230001, "acc_step": 0, "speed/wps": 76.09946119768794, "speed/FLOPS": 3363206672585.2476, "speed/curr_iter_time": 120.096, "speed/data_load_time": 94.5904, "speed/curr_step_time": 120.096, "speed/est_time_elapsed": "319.7 days", "speed/est_time_remaining": "12.51 days", "speed/est_time_elapsed_hrs": 7672.83, "speed/est_time_elapsed_days": 319.7, "speed/est_time_remaining_hrs": 300.21, "speed/est_time_remaining_days": 12.51, "optim/grad_norm": 0.04446012154221535, "optim/lr": 3.192484921091469e-05, "optim/total_tokens": 1929388228608, "memory/max_active_gib": 81.95657110214233, "memory/max_active_pct": 64.0285711735487, "memory/max_reserved_gib": 83.50390625, "memory/max_reserved_pct": 65.2374267578125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3118090629577637, "created_at": "2025-06-03T03:31:31.676939+00:00"} {"global_step": 230002, "acc_step": 0, "speed/wps": 4242.486964745406, "speed/FLOPS": 187496208824947.44, "speed/curr_iter_time": 3.859, "speed/data_load_time": 0.001, "speed/curr_step_time": 3.859, "speed/est_time_elapsed": "10.27 days", "speed/est_time_remaining": "9.65 hours", "speed/est_time_elapsed_hrs": 246.55, "speed/est_time_elapsed_days": 10.27, "speed/est_time_remaining_hrs": 9.65, "speed/est_time_remaining_days": 0.4, "optim/grad_norm": 0.042861130088567734, "optim/lr": 3.192147862530837e-05, "optim/total_tokens": 1929396617216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.297986388206482, "created_at": "2025-06-03T03:31:35.550946+00:00"} {"global_step": 230003, "acc_step": 0, "speed/wps": 5598.806898979758, "speed/FLOPS": 247438607643349.94, "speed/curr_iter_time": 2.9252, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9252, "speed/est_time_elapsed": "7.79 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 186.89, "speed/est_time_elapsed_days": 7.79, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04528859630227089, "optim/lr": 3.191793140021382e-05, "optim/total_tokens": 1929405005824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.300289273262024, "created_at": "2025-06-03T03:31:38.485516+00:00"} {"global_step": 230004, "acc_step": 0, "speed/wps": 5557.080210394255, "speed/FLOPS": 245594501584424.06, "speed/curr_iter_time": 2.9474, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9474, "speed/est_time_elapsed": "7.85 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 188.31, "speed/est_time_elapsed_days": 7.85, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04237978905439377, "optim/lr": 3.191438417511949e-05, "optim/total_tokens": 1929413394432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3253506422042847, "created_at": "2025-06-03T03:31:41.441916+00:00"} {"global_step": 230005, "acc_step": 0, "speed/wps": 5551.551696209722, "speed/FLOPS": 245350169554968.5, "speed/curr_iter_time": 2.9495, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9495, "speed/est_time_elapsed": "7.85 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 188.44, "speed/est_time_elapsed_days": 7.85, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04301590099930763, "optim/lr": 3.191083695002495e-05, "optim/total_tokens": 1929421783040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3194760084152222, "created_at": "2025-06-03T03:31:44.400736+00:00"} {"global_step": 230006, "acc_step": 0, "speed/wps": 5529.34243162896, "speed/FLOPS": 244368633737820.06, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.26, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.042491085827350616, "optim/lr": 3.19072897249304e-05, "optim/total_tokens": 1929430171648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2939505577087402, "created_at": "2025-06-03T03:31:47.371298+00:00"} {"global_step": 230007, "acc_step": 0, "speed/wps": 5525.527722617794, "speed/FLOPS": 244200043124977.28, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.39, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.041967812925577164, "optim/lr": 3.1903742499835856e-05, "optim/total_tokens": 1929438560256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3070135116577148, "created_at": "2025-06-03T03:31:50.345342+00:00"} {"global_step": 230008, "acc_step": 0, "speed/wps": 5545.937863096848, "speed/FLOPS": 245102066865582.16, "speed/curr_iter_time": 2.9525, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9525, "speed/est_time_elapsed": "7.86 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 188.64, "speed/est_time_elapsed_days": 7.86, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0434415228664875, "optim/lr": 3.190019527474153e-05, "optim/total_tokens": 1929446948864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3093315362930298, "created_at": "2025-06-03T03:31:53.307344+00:00"} {"global_step": 230009, "acc_step": 0, "speed/wps": 5526.1448924528795, "speed/FLOPS": 244227318872726.47, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.37, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04246861860156059, "optim/lr": 3.189664804964698e-05, "optim/total_tokens": 1929455337472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3021913766860962, "created_at": "2025-06-03T03:31:56.279485+00:00"} {"global_step": 230010, "acc_step": 0, "speed/wps": 5531.869786394499, "speed/FLOPS": 244480329882282.5, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.18, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.056476909667253494, "optim/lr": 3.189310082455244e-05, "optim/total_tokens": 1929463726080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.30154287815094, "created_at": "2025-06-03T03:31:59.248256+00:00"} {"global_step": 230011, "acc_step": 0, "speed/wps": 5540.64159873743, "speed/FLOPS": 244867999089634.38, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 188.88, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04580334573984146, "optim/lr": 3.188955359945789e-05, "optim/total_tokens": 1929472114688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3019160032272339, "created_at": "2025-06-03T03:32:02.213908+00:00"} {"global_step": 230012, "acc_step": 0, "speed/wps": 5521.994054025701, "speed/FLOPS": 244043873060162.25, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.45, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04476410150527954, "optim/lr": 3.188600637436356e-05, "optim/total_tokens": 1929480503296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3042027950286865, "created_at": "2025-06-03T03:32:05.187101+00:00"} {"global_step": 230013, "acc_step": 0, "speed/wps": 5507.605913912143, "speed/FLOPS": 243407990912320.16, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.42 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.42, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.051688238978385925, "optim/lr": 3.188245914926902e-05, "optim/total_tokens": 1929488891904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3141019344329834, "created_at": "2025-06-03T03:32:08.170836+00:00"} {"global_step": 230014, "acc_step": 0, "speed/wps": 5518.395873738909, "speed/FLOPS": 243884851908642.3, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.41 hours", "speed/est_time_elapsed_hrs": 189.64, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.41, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04328198730945587, "optim/lr": 3.187891192417447e-05, "optim/total_tokens": 1929497280512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3080506324768066, "created_at": "2025-06-03T03:32:11.145466+00:00"} {"global_step": 230015, "acc_step": 0, "speed/wps": 5514.686695871325, "speed/FLOPS": 243720925232188.47, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.41 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.41, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04320775717496872, "optim/lr": 3.1875364699079925e-05, "optim/total_tokens": 1929505669120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.311832308769226, "created_at": "2025-06-03T03:32:14.123816+00:00"} {"global_step": 230016, "acc_step": 0, "speed/wps": 5533.122800085057, "speed/FLOPS": 244535706673899.7, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.14, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04315410181879997, "optim/lr": 3.18718174739856e-05, "optim/total_tokens": 1929514057728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.307748794555664, "created_at": "2025-06-03T03:32:17.092895+00:00"} {"global_step": 230017, "acc_step": 0, "speed/wps": 5533.553574598786, "speed/FLOPS": 244554744702502.7, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.13, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04945346713066101, "optim/lr": 3.186827024889105e-05, "optim/total_tokens": 1929522446336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3062304258346558, "created_at": "2025-06-03T03:32:20.062557+00:00"} {"global_step": 230018, "acc_step": 0, "speed/wps": 5514.646102626717, "speed/FLOPS": 243719131218551.84, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.41 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.41, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0472959466278553, "optim/lr": 3.1864723023796506e-05, "optim/total_tokens": 1929530834944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2986605167388916, "created_at": "2025-06-03T03:32:23.042091+00:00"} {"global_step": 230019, "acc_step": 0, "speed/wps": 5520.990332086023, "speed/FLOPS": 243999513687943.1, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.57, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.044247571378946304, "optim/lr": 3.186117579870218e-05, "optim/total_tokens": 1929539223552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.308000922203064, "created_at": "2025-06-03T03:32:26.014984+00:00"} {"global_step": 230020, "acc_step": 0, "speed/wps": 5528.247985578229, "speed/FLOPS": 244320264824260.5, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.31, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.03938888758420944, "optim/lr": 3.185762857360763e-05, "optim/total_tokens": 1929547612160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3042495250701904, "created_at": "2025-06-03T03:32:28.982916+00:00"} {"global_step": 230021, "acc_step": 0, "speed/wps": 5507.559293426473, "speed/FLOPS": 243405930525478.84, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.42 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.42, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04349526762962341, "optim/lr": 3.185408134851309e-05, "optim/total_tokens": 1929556000768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3099192380905151, "created_at": "2025-06-03T03:32:31.965658+00:00"} {"global_step": 230022, "acc_step": 0, "speed/wps": 5502.260673906121, "speed/FLOPS": 243171758663472.56, "speed/curr_iter_time": 2.976, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.976, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.42 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.42, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04482492431998253, "optim/lr": 3.185053412341854e-05, "optim/total_tokens": 1929564389376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2950176000595093, "created_at": "2025-06-03T03:32:34.948144+00:00"} {"global_step": 230023, "acc_step": 0, "speed/wps": 5494.954914721485, "speed/FLOPS": 242848881501777.0, "speed/curr_iter_time": 2.9809, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9809, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.43 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.43, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04052675887942314, "optim/lr": 3.184698689832422e-05, "optim/total_tokens": 1929572777984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.321685552597046, "created_at": "2025-06-03T03:32:37.935451+00:00"} {"global_step": 230024, "acc_step": 0, "speed/wps": 5523.319568027211, "speed/FLOPS": 244102453994433.28, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.49, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.042148854583501816, "optim/lr": 3.184343967322967e-05, "optim/total_tokens": 1929581166592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3131951093673706, "created_at": "2025-06-03T03:32:40.908158+00:00"} {"global_step": 230025, "acc_step": 0, "speed/wps": 5527.15489827123, "speed/FLOPS": 244271955960219.16, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.3, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0423436276614666, "optim/lr": 3.183989244813512e-05, "optim/total_tokens": 1929589555200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3146077394485474, "created_at": "2025-06-03T03:32:43.878771+00:00"} {"global_step": 230026, "acc_step": 0, "speed/wps": 5530.773477699457, "speed/FLOPS": 244431878649378.22, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.23, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04102912172675133, "optim/lr": 3.1836345223040575e-05, "optim/total_tokens": 1929597943808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2999420166015625, "created_at": "2025-06-03T03:32:46.848597+00:00"} {"global_step": 230027, "acc_step": 0, "speed/wps": 5513.647037177885, "speed/FLOPS": 243674977639394.03, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04190303012728691, "optim/lr": 3.183279799794625e-05, "optim/total_tokens": 1929606332416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3066339492797852, "created_at": "2025-06-03T03:32:49.826875+00:00"} {"global_step": 230028, "acc_step": 0, "speed/wps": 5517.489932029045, "speed/FLOPS": 243844813922096.34, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04209239408373833, "optim/lr": 3.1829250772851706e-05, "optim/total_tokens": 1929614721024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.3059087991714478, "created_at": "2025-06-03T03:32:52.805668+00:00"} {"global_step": 230029, "acc_step": 0, "speed/wps": 5516.398553008303, "speed/FLOPS": 243796580555563.75, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.040972139686346054, "optim/lr": 3.1825703547757156e-05, "optim/total_tokens": 1929623109632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3072839975357056, "created_at": "2025-06-03T03:32:55.784652+00:00"} {"global_step": 230030, "acc_step": 0, "speed/wps": 5511.738025390618, "speed/FLOPS": 243590609089604.9, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04196644574403763, "optim/lr": 3.1822156322662607e-05, "optim/total_tokens": 1929631498240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3042727708816528, "created_at": "2025-06-03T03:32:58.763219+00:00"} {"global_step": 230031, "acc_step": 0, "speed/wps": 5519.302435943115, "speed/FLOPS": 243924917317862.2, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04180702194571495, "optim/lr": 3.181860909756829e-05, "optim/total_tokens": 1929639886848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3276761770248413, "created_at": "2025-06-03T03:33:01.739767+00:00"} {"global_step": 230032, "acc_step": 0, "speed/wps": 5515.138119903075, "speed/FLOPS": 243740875863794.16, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04021088033914566, "optim/lr": 3.181506187247374e-05, "optim/total_tokens": 1929648275456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3022836446762085, "created_at": "2025-06-03T03:33:04.715364+00:00"} {"global_step": 230033, "acc_step": 0, "speed/wps": 5521.723601584763, "speed/FLOPS": 244031920446573.88, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04230045527219772, "optim/lr": 3.1811514647379194e-05, "optim/total_tokens": 1929656664064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3025134801864624, "created_at": "2025-06-03T03:33:07.687181+00:00"} {"global_step": 230034, "acc_step": 0, "speed/wps": 5520.4833732185, "speed/FLOPS": 243977108700849.28, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.041724879294633865, "optim/lr": 3.1807967422284645e-05, "optim/total_tokens": 1929665052672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3142945766448975, "created_at": "2025-06-03T03:33:10.662154+00:00"} {"global_step": 230035, "acc_step": 0, "speed/wps": 5507.336124603827, "speed/FLOPS": 243396067605799.47, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.040332693606615067, "optim/lr": 3.180442019719032e-05, "optim/total_tokens": 1929673441280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3148024082183838, "created_at": "2025-06-03T03:33:13.645189+00:00"} {"global_step": 230036, "acc_step": 0, "speed/wps": 5507.944495202785, "speed/FLOPS": 243422954472350.4, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.41 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.41, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.040913667529821396, "optim/lr": 3.1800872972095775e-05, "optim/total_tokens": 1929681829888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3046395778656006, "created_at": "2025-06-03T03:33:16.626449+00:00"} {"global_step": 230037, "acc_step": 0, "speed/wps": 5507.878481433073, "speed/FLOPS": 243420037001618.22, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04332950338721275, "optim/lr": 3.1797325747001226e-05, "optim/total_tokens": 1929690218496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2980501651763916, "created_at": "2025-06-03T03:33:19.606058+00:00"} {"global_step": 230038, "acc_step": 0, "speed/wps": 5531.527489468552, "speed/FLOPS": 244465202110190.12, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.16, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04256786033511162, "optim/lr": 3.179377852190668e-05, "optim/total_tokens": 1929698607104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2986574172973633, "created_at": "2025-06-03T03:33:22.574143+00:00"} {"global_step": 230039, "acc_step": 0, "speed/wps": 5512.611606122042, "speed/FLOPS": 243629216886542.34, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0408458448946476, "optim/lr": 3.1790231296812356e-05, "optim/total_tokens": 1929706995712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3135321140289307, "created_at": "2025-06-03T03:33:25.551392+00:00"} {"global_step": 230040, "acc_step": 0, "speed/wps": 5516.153287262424, "speed/FLOPS": 243785741064979.8, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04150072857737541, "optim/lr": 3.178668407171781e-05, "optim/total_tokens": 1929715384320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3228002786636353, "created_at": "2025-06-03T03:33:28.529200+00:00"} {"global_step": 230041, "acc_step": 0, "speed/wps": 5516.400415984528, "speed/FLOPS": 243796662889577.34, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04399152100086212, "optim/lr": 3.1783136846623264e-05, "optim/total_tokens": 1929723772928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2917650938034058, "created_at": "2025-06-03T03:33:31.504630+00:00"} {"global_step": 230042, "acc_step": 0, "speed/wps": 5514.082029105186, "speed/FLOPS": 243694202056090.2, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04065658897161484, "optim/lr": 3.1779589621528714e-05, "optim/total_tokens": 1929732161536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3088399171829224, "created_at": "2025-06-03T03:33:34.481453+00:00"} {"global_step": 230043, "acc_step": 0, "speed/wps": 5520.670768644433, "speed/FLOPS": 243985390619498.78, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04234984889626503, "optim/lr": 3.177604239643439e-05, "optim/total_tokens": 1929740550144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3055356740951538, "created_at": "2025-06-03T03:33:37.454200+00:00"} {"global_step": 230044, "acc_step": 0, "speed/wps": 5510.953933207472, "speed/FLOPS": 243555956228457.47, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04175304248929024, "optim/lr": 3.1772495171339845e-05, "optim/total_tokens": 1929748938752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3041151762008667, "created_at": "2025-06-03T03:33:40.436165+00:00"} {"global_step": 230045, "acc_step": 0, "speed/wps": 5520.774896379578, "speed/FLOPS": 243989992532418.16, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0417504720389843, "optim/lr": 3.1768947946245295e-05, "optim/total_tokens": 1929757327360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3081629276275635, "created_at": "2025-06-03T03:33:43.408150+00:00"} {"global_step": 230046, "acc_step": 0, "speed/wps": 5521.003148192668, "speed/FLOPS": 244000080094258.03, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.58, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.15079058706760406, "optim/lr": 3.176540072115097e-05, "optim/total_tokens": 1929765715968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3002948760986328, "created_at": "2025-06-03T03:33:46.380733+00:00"} {"global_step": 230047, "acc_step": 0, "speed/wps": 5507.988235375582, "speed/FLOPS": 243424887564105.53, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.040677689015865326, "optim/lr": 3.1761853496056426e-05, "optim/total_tokens": 1929774104576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.3067716360092163, "created_at": "2025-06-03T03:33:49.362795+00:00"} {"global_step": 230048, "acc_step": 0, "speed/wps": 5506.265360191501, "speed/FLOPS": 243348745299443.75, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.18664202094078064, "optim/lr": 3.1758306270961876e-05, "optim/total_tokens": 1929782493184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3044872283935547, "created_at": "2025-06-03T03:33:52.345713+00:00"} {"global_step": 230049, "acc_step": 0, "speed/wps": 5502.81160691542, "speed/FLOPS": 243196107082552.8, "speed/curr_iter_time": 2.9767, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9767, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.4 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.4, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.05477311834692955, "optim/lr": 3.175475904586733e-05, "optim/total_tokens": 1929790881792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.303222417831421, "created_at": "2025-06-03T03:33:55.329309+00:00"} {"global_step": 230050, "acc_step": 0, "speed/wps": 5525.394318737782, "speed/FLOPS": 244194147356303.7, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.43, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.058578066527843475, "optim/lr": 3.175121182077301e-05, "optim/total_tokens": 1929799270400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3075910806655884, "created_at": "2025-06-03T03:33:58.304566+00:00"} {"global_step": 230051, "acc_step": 0, "speed/wps": 5509.088394042261, "speed/FLOPS": 243473508946050.22, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.050655726343393326, "optim/lr": 3.1747664595678464e-05, "optim/total_tokens": 1929807659008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3007837533950806, "created_at": "2025-06-03T03:34:01.283544+00:00"} {"global_step": 230052, "acc_step": 0, "speed/wps": 5509.922396559087, "speed/FLOPS": 243510367588482.06, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04979061335325241, "optim/lr": 3.1744117370583914e-05, "optim/total_tokens": 1929816047616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2990790605545044, "created_at": "2025-06-03T03:34:04.261306+00:00"} {"global_step": 230053, "acc_step": 0, "speed/wps": 5514.796493116303, "speed/FLOPS": 243725777708423.25, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.8, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04418467357754707, "optim/lr": 3.1740570145489364e-05, "optim/total_tokens": 1929824436224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.3098918199539185, "created_at": "2025-06-03T03:34:07.237117+00:00"} {"global_step": 230054, "acc_step": 0, "speed/wps": 5517.686084826446, "speed/FLOPS": 243853482871740.44, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0442020446062088, "optim/lr": 3.1737022920395045e-05, "optim/total_tokens": 1929832824832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.298317551612854, "created_at": "2025-06-03T03:34:10.214555+00:00"} {"global_step": 230055, "acc_step": 0, "speed/wps": 5515.984306433391, "speed/FLOPS": 243778272977258.84, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04684342443943024, "optim/lr": 3.1733475695300495e-05, "optim/total_tokens": 1929841213440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2958154678344727, "created_at": "2025-06-03T03:34:13.190031+00:00"} {"global_step": 230056, "acc_step": 0, "speed/wps": 5507.732056388177, "speed/FLOPS": 243413565764105.16, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04542912170290947, "optim/lr": 3.172992847020595e-05, "optim/total_tokens": 1929849602048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.31475830078125, "created_at": "2025-06-03T03:34:16.169594+00:00"} {"global_step": 230057, "acc_step": 0, "speed/wps": 5514.060221989291, "speed/FLOPS": 243693238293186.56, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.047132305800914764, "optim/lr": 3.17263812451114e-05, "optim/total_tokens": 1929857990656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3019120693206787, "created_at": "2025-06-03T03:34:19.145555+00:00"} {"global_step": 230058, "acc_step": 0, "speed/wps": 5507.628334718948, "speed/FLOPS": 243408981797220.88, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.043952904641628265, "optim/lr": 3.1722834020017076e-05, "optim/total_tokens": 1929866379264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3201366662979126, "created_at": "2025-06-03T03:34:22.127858+00:00"} {"global_step": 230059, "acc_step": 0, "speed/wps": 5510.590080839365, "speed/FLOPS": 243539875816152.4, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.042415469884872437, "optim/lr": 3.171928679492253e-05, "optim/total_tokens": 1929874767872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3034590482711792, "created_at": "2025-06-03T03:34:25.106424+00:00"} {"global_step": 230060, "acc_step": 0, "speed/wps": 5517.883063708417, "speed/FLOPS": 243862188330094.22, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04514642804861069, "optim/lr": 3.171573956982798e-05, "optim/total_tokens": 1929883156480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3178215026855469, "created_at": "2025-06-03T03:34:28.083059+00:00"} {"global_step": 230061, "acc_step": 0, "speed/wps": 5502.7435551206645, "speed/FLOPS": 243193099541545.25, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.39 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.39, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04243621602654457, "optim/lr": 3.171219234473344e-05, "optim/total_tokens": 1929891545088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3007347583770752, "created_at": "2025-06-03T03:34:31.068357+00:00"} {"global_step": 230062, "acc_step": 0, "speed/wps": 5513.173796631675, "speed/FLOPS": 243654062829516.22, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04334142431616783, "optim/lr": 3.1708645119639114e-05, "optim/total_tokens": 1929899933696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3006901741027832, "created_at": "2025-06-03T03:34:34.048493+00:00"} {"global_step": 230063, "acc_step": 0, "speed/wps": 5515.33336285943, "speed/FLOPS": 243749504603121.0, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04633117467164993, "optim/lr": 3.1705097894544564e-05, "optim/total_tokens": 1929908322304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3055094480514526, "created_at": "2025-06-03T03:34:37.025073+00:00"} {"global_step": 230064, "acc_step": 0, "speed/wps": 5513.918294587831, "speed/FLOPS": 243686965828492.34, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0440404936671257, "optim/lr": 3.170155066945002e-05, "optim/total_tokens": 1929916710912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3108251094818115, "created_at": "2025-06-03T03:34:40.004816+00:00"} {"global_step": 230065, "acc_step": 0, "speed/wps": 5512.143376189904, "speed/FLOPS": 243608523520159.9, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04258965700864792, "optim/lr": 3.169800344435547e-05, "optim/total_tokens": 1929925099520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3153043985366821, "created_at": "2025-06-03T03:34:42.983619+00:00"} {"global_step": 230066, "acc_step": 0, "speed/wps": 5522.111663948048, "speed/FLOPS": 244049070816747.8, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.56, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.042361222207546234, "optim/lr": 3.1694456219261145e-05, "optim/total_tokens": 1929933488128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3138340711593628, "created_at": "2025-06-03T03:34:45.960650+00:00"} {"global_step": 230067, "acc_step": 0, "speed/wps": 5508.143907154259, "speed/FLOPS": 243431767459922.66, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.042938265949487686, "optim/lr": 3.16909089941666e-05, "optim/total_tokens": 1929941876736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.309889793395996, "created_at": "2025-06-03T03:34:48.943073+00:00"} {"global_step": 230068, "acc_step": 0, "speed/wps": 5524.948926962681, "speed/FLOPS": 244174463319566.0, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.47, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04046083241701126, "optim/lr": 3.168736176907205e-05, "optim/total_tokens": 1929950265344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3080414533615112, "created_at": "2025-06-03T03:34:51.913462+00:00"} {"global_step": 230069, "acc_step": 0, "speed/wps": 5524.099172248273, "speed/FLOPS": 244136908510628.1, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.44, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04240109398961067, "optim/lr": 3.168381454397751e-05, "optim/total_tokens": 1929958653952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.30054771900177, "created_at": "2025-06-03T03:34:54.886648+00:00"} {"global_step": 230070, "acc_step": 0, "speed/wps": 5518.149001083458, "speed/FLOPS": 243873941400880.16, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04181358963251114, "optim/lr": 3.1680267318883183e-05, "optim/total_tokens": 1929967042560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.303098201751709, "created_at": "2025-06-03T03:34:57.861450+00:00"} {"global_step": 230071, "acc_step": 0, "speed/wps": 5516.137096689576, "speed/FLOPS": 243785025524530.78, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04605964571237564, "optim/lr": 3.1676720093788634e-05, "optim/total_tokens": 1929975431168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.3057938814163208, "created_at": "2025-06-03T03:35:00.837322+00:00"} {"global_step": 230072, "acc_step": 0, "speed/wps": 5500.923075442989, "speed/FLOPS": 243112643657851.7, "speed/curr_iter_time": 2.9769, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9769, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.38 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.38, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04503263533115387, "optim/lr": 3.167317286869409e-05, "optim/total_tokens": 1929983819776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.305795431137085, "created_at": "2025-06-03T03:35:03.820244+00:00"} {"global_step": 230073, "acc_step": 0, "speed/wps": 5509.984889158891, "speed/FLOPS": 243513129441527.28, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04453245550394058, "optim/lr": 3.1669625643599764e-05, "optim/total_tokens": 1929992208384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.323005199432373, "created_at": "2025-06-03T03:35:06.800591+00:00"} {"global_step": 230074, "acc_step": 0, "speed/wps": 5515.040997650522, "speed/FLOPS": 243736583557348.06, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.041606683284044266, "optim/lr": 3.1666078418505215e-05, "optim/total_tokens": 1930000596992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3055626153945923, "created_at": "2025-06-03T03:35:09.779129+00:00"} {"global_step": 230075, "acc_step": 0, "speed/wps": 5517.76337967919, "speed/FLOPS": 243856898908600.78, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.051313478499650955, "optim/lr": 3.166253119341067e-05, "optim/total_tokens": 1930008985600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2974073886871338, "created_at": "2025-06-03T03:35:12.757416+00:00"} {"global_step": 230076, "acc_step": 0, "speed/wps": 5521.1298882101955, "speed/FLOPS": 244005681354318.5, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.045848943293094635, "optim/lr": 3.165898396831612e-05, "optim/total_tokens": 1930017374208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3174928426742554, "created_at": "2025-06-03T03:35:15.729486+00:00"} {"global_step": 230077, "acc_step": 0, "speed/wps": 5516.15419964163, "speed/FLOPS": 243785781387470.72, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04600617289543152, "optim/lr": 3.16554367432218e-05, "optim/total_tokens": 1930025762816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3115911483764648, "created_at": "2025-06-03T03:35:18.706835+00:00"} {"global_step": 230078, "acc_step": 0, "speed/wps": 5511.209698516805, "speed/FLOPS": 243567259746004.44, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04312900826334953, "optim/lr": 3.165188951812725e-05, "optim/total_tokens": 1930034151424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3052868843078613, "created_at": "2025-06-03T03:35:21.684462+00:00"} {"global_step": 230079, "acc_step": 0, "speed/wps": 5519.264393731677, "speed/FLOPS": 243923236046834.3, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.62, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04298844560980797, "optim/lr": 3.16483422930327e-05, "optim/total_tokens": 1930042540032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3081512451171875, "created_at": "2025-06-03T03:35:24.660999+00:00"} {"global_step": 230080, "acc_step": 0, "speed/wps": 5516.537493058814, "speed/FLOPS": 243802720994636.72, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04101487621665001, "optim/lr": 3.164479506793816e-05, "optim/total_tokens": 1930050928640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3027105331420898, "created_at": "2025-06-03T03:35:27.636490+00:00"} {"global_step": 230081, "acc_step": 0, "speed/wps": 5521.458234997771, "speed/FLOPS": 244020192601698.12, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04304086044430733, "optim/lr": 3.1641247842843834e-05, "optim/total_tokens": 1930059317248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.311493158340454, "created_at": "2025-06-03T03:35:30.611993+00:00"} {"global_step": 230082, "acc_step": 0, "speed/wps": 5514.966349900401, "speed/FLOPS": 243733284508874.53, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.042123377323150635, "optim/lr": 3.163770061774929e-05, "optim/total_tokens": 1930067705856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3175196647644043, "created_at": "2025-06-03T03:35:33.587708+00:00"} {"global_step": 230083, "acc_step": 0, "speed/wps": 5520.792993127318, "speed/FLOPS": 243990792316040.7, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.043780531734228134, "optim/lr": 3.163415339265474e-05, "optim/total_tokens": 1930076094464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3166738748550415, "created_at": "2025-06-03T03:35:36.562174+00:00"} {"global_step": 230084, "acc_step": 0, "speed/wps": 5525.623938496065, "speed/FLOPS": 244204295374319.38, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 189.46, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04117489606142044, "optim/lr": 3.163060616756019e-05, "optim/total_tokens": 1930084483072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3024053573608398, "created_at": "2025-06-03T03:35:39.532080+00:00"} {"global_step": 230085, "acc_step": 0, "speed/wps": 5520.618564407116, "speed/FLOPS": 243983083459414.88, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04487608000636101, "optim/lr": 3.162705894246587e-05, "optim/total_tokens": 1930092871680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.312448263168335, "created_at": "2025-06-03T03:35:42.506365+00:00"} {"global_step": 230086, "acc_step": 0, "speed/wps": 5529.94732506881, "speed/FLOPS": 244395366931736.12, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.26, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.048984311521053314, "optim/lr": 3.162351171737132e-05, "optim/total_tokens": 1930101260288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3088881969451904, "created_at": "2025-06-03T03:35:45.477701+00:00"} {"global_step": 230087, "acc_step": 0, "speed/wps": 5517.832628582577, "speed/FLOPS": 243859959355682.47, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.041040848940610886, "optim/lr": 3.161996449227678e-05, "optim/total_tokens": 1930109648896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3131370544433594, "created_at": "2025-06-03T03:35:48.451497+00:00"} {"global_step": 230088, "acc_step": 0, "speed/wps": 5516.008920243718, "speed/FLOPS": 243779360781690.4, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04925958439707756, "optim/lr": 3.161641726718223e-05, "optim/total_tokens": 1930118037504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3319028615951538, "created_at": "2025-06-03T03:35:51.427683+00:00"} {"global_step": 230089, "acc_step": 0, "speed/wps": 5511.045899308096, "speed/FLOPS": 243560020659379.88, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.043362807482481, "optim/lr": 3.16128700420879e-05, "optim/total_tokens": 1930126426112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3023993968963623, "created_at": "2025-06-03T03:35:54.409221+00:00"} {"global_step": 230090, "acc_step": 0, "speed/wps": 5523.610057568554, "speed/FLOPS": 244115292145300.38, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04156254604458809, "optim/lr": 3.160932281699336e-05, "optim/total_tokens": 1930134814720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3060266971588135, "created_at": "2025-06-03T03:35:57.383109+00:00"} {"global_step": 230091, "acc_step": 0, "speed/wps": 5496.776788378088, "speed/FLOPS": 242929398992204.12, "speed/curr_iter_time": 2.9799, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9799, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.37 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.37, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04126777872443199, "optim/lr": 3.160577559189881e-05, "optim/total_tokens": 1930143203328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3018945455551147, "created_at": "2025-06-03T03:36:00.368769+00:00"} {"global_step": 230092, "acc_step": 0, "speed/wps": 5527.885247975674, "speed/FLOPS": 244304233678886.9, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.33, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04526524245738983, "optim/lr": 3.160222836680427e-05, "optim/total_tokens": 1930151591936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.312212586402893, "created_at": "2025-06-03T03:36:03.338614+00:00"} {"global_step": 230093, "acc_step": 0, "speed/wps": 5515.9156037344255, "speed/FLOPS": 243775236669616.84, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04568150267004967, "optim/lr": 3.159868114170994e-05, "optim/total_tokens": 1930159980544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3002876043319702, "created_at": "2025-06-03T03:36:06.314019+00:00"} {"global_step": 230094, "acc_step": 0, "speed/wps": 5527.039995462194, "speed/FLOPS": 244266877844185.66, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.42, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.041967444121837616, "optim/lr": 3.159513391661539e-05, "optim/total_tokens": 1930168369152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3157970905303955, "created_at": "2025-06-03T03:36:09.282727+00:00"} {"global_step": 230095, "acc_step": 0, "speed/wps": 5519.74265950333, "speed/FLOPS": 243944372945955.28, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04109487682580948, "optim/lr": 3.159158669152085e-05, "optim/total_tokens": 1930176757760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.312121033668518, "created_at": "2025-06-03T03:36:12.258739+00:00"} {"global_step": 230096, "acc_step": 0, "speed/wps": 5513.604268094096, "speed/FLOPS": 243673087464802.56, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04166774824261665, "optim/lr": 3.15880394664263e-05, "optim/total_tokens": 1930185146368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3146326541900635, "created_at": "2025-06-03T03:36:15.237705+00:00"} {"global_step": 230097, "acc_step": 0, "speed/wps": 5520.119890526019, "speed/FLOPS": 243961044626314.7, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04377732053399086, "optim/lr": 3.158449224133197e-05, "optim/total_tokens": 1930193534976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3093327283859253, "created_at": "2025-06-03T03:36:18.210326+00:00"} {"global_step": 230098, "acc_step": 0, "speed/wps": 5524.013957126503, "speed/FLOPS": 244133142438416.38, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.52, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04327884316444397, "optim/lr": 3.158094501623743e-05, "optim/total_tokens": 1930201923584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3157562017440796, "created_at": "2025-06-03T03:36:21.183726+00:00"} {"global_step": 230099, "acc_step": 0, "speed/wps": 5517.605789218841, "speed/FLOPS": 243849934216874.47, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.0442989207804203, "optim/lr": 3.157739779114288e-05, "optim/total_tokens": 1930210312192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3109707832336426, "created_at": "2025-06-03T03:36:24.160581+00:00"} {"global_step": 230100, "acc_step": 0, "speed/wps": 5519.997091362552, "speed/FLOPS": 243955617531832.56, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.051778484135866165, "optim/lr": 3.1573850566048337e-05, "optim/total_tokens": 1930218700800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3221759796142578, "created_at": "2025-06-03T03:36:27.133762+00:00"} {"global_step": 230101, "acc_step": 0, "speed/wps": 5538.801301766843, "speed/FLOPS": 244786667383028.2, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.02, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04049907997250557, "optim/lr": 3.157030334095401e-05, "optim/total_tokens": 1930227089408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3045631647109985, "created_at": "2025-06-03T03:36:30.097268+00:00"} {"global_step": 230102, "acc_step": 0, "speed/wps": 5534.662712281119, "speed/FLOPS": 244603762910980.5, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.11, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.051892247051000595, "optim/lr": 3.156675611585946e-05, "optim/total_tokens": 1930235478016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2993184328079224, "created_at": "2025-06-03T03:36:33.062367+00:00"} {"global_step": 230103, "acc_step": 0, "speed/wps": 5526.594179921749, "speed/FLOPS": 244247175079188.75, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.43, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04230154678225517, "optim/lr": 3.156320889076492e-05, "optim/total_tokens": 1930243866624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3297204971313477, "created_at": "2025-06-03T03:36:36.036423+00:00"} {"global_step": 230104, "acc_step": 0, "speed/wps": 5508.614046912365, "speed/FLOPS": 243452545230837.5, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.35 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.35, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04574139416217804, "optim/lr": 3.155966166567059e-05, "optim/total_tokens": 1930252255232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.309483289718628, "created_at": "2025-06-03T03:36:39.015717+00:00"} {"global_step": 230105, "acc_step": 0, "speed/wps": 5541.229675165555, "speed/FLOPS": 244893989057709.47, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 188.94, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04497325420379639, "optim/lr": 3.155611444057604e-05, "optim/total_tokens": 1930260643840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2928791046142578, "created_at": "2025-06-03T03:36:41.977008+00:00"} {"global_step": 230106, "acc_step": 0, "speed/wps": 5521.815746801174, "speed/FLOPS": 244035992793497.25, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.040831275284290314, "optim/lr": 3.15525672154815e-05, "optim/total_tokens": 1930269032448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.31751549243927, "created_at": "2025-06-03T03:36:44.950557+00:00"} {"global_step": 230107, "acc_step": 0, "speed/wps": 5522.631771607091, "speed/FLOPS": 244072056913125.2, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.58, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04133777320384979, "optim/lr": 3.154901999038695e-05, "optim/total_tokens": 1930277421056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3107073307037354, "created_at": "2025-06-03T03:36:47.924042+00:00"} {"global_step": 230108, "acc_step": 0, "speed/wps": 5520.900420456261, "speed/FLOPS": 243995540054117.03, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04467596858739853, "optim/lr": 3.154547276529263e-05, "optim/total_tokens": 1930285809664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.316908359527588, "created_at": "2025-06-03T03:36:50.896492+00:00"} {"global_step": 230109, "acc_step": 0, "speed/wps": 5520.574777588369, "speed/FLOPS": 243981148306147.53, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0021, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.46, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.05414614826440811, "optim/lr": 3.154192554019808e-05, "optim/total_tokens": 1930294198272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.302505612373352, "created_at": "2025-06-03T03:36:53.868170+00:00"} {"global_step": 230110, "acc_step": 0, "speed/wps": 5528.933659041072, "speed/FLOPS": 244350568081723.2, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.32, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04061993584036827, "optim/lr": 3.153837831510353e-05, "optim/total_tokens": 1930302586880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3047151565551758, "created_at": "2025-06-03T03:36:56.835173+00:00"} {"global_step": 230111, "acc_step": 0, "speed/wps": 5524.81527645479, "speed/FLOPS": 244168556651202.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.48, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04752560704946518, "optim/lr": 3.153483109000899e-05, "optim/total_tokens": 1930310975488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3012772798538208, "created_at": "2025-06-03T03:36:59.807840+00:00"} {"global_step": 230112, "acc_step": 0, "speed/wps": 5507.609144769666, "speed/FLOPS": 243408133699685.7, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04177291691303253, "optim/lr": 3.153128386491466e-05, "optim/total_tokens": 1930319364096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3320399522781372, "created_at": "2025-06-03T03:37:02.788779+00:00"} {"global_step": 230113, "acc_step": 0, "speed/wps": 5521.972149185099, "speed/FLOPS": 244042904978326.75, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.52, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04560358449816704, "optim/lr": 3.152773663982012e-05, "optim/total_tokens": 1930327752704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2955610752105713, "created_at": "2025-06-03T03:37:05.762205+00:00"} {"global_step": 230114, "acc_step": 0, "speed/wps": 5515.127799569293, "speed/FLOPS": 243740419757865.25, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04443968087434769, "optim/lr": 3.152418941472557e-05, "optim/total_tokens": 1930336141312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3015326261520386, "created_at": "2025-06-03T03:37:08.739996+00:00"} {"global_step": 230115, "acc_step": 0, "speed/wps": 5513.315525882632, "speed/FLOPS": 243660326536972.47, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.04050842300057411, "optim/lr": 3.152064218963102e-05, "optim/total_tokens": 1930344529920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.28581964969635, "created_at": "2025-06-03T03:37:11.717777+00:00"} {"global_step": 230116, "acc_step": 0, "speed/wps": 5489.543775083712, "speed/FLOPS": 242609736826510.88, "speed/curr_iter_time": 2.9808, "speed/data_load_time": 0.0022, "speed/curr_step_time": 2.9808, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.36 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.36, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.040986429899930954, "optim/lr": 3.15170949645367e-05, "optim/total_tokens": 1930352918528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2984845638275146, "created_at": "2025-06-03T03:37:14.709087+00:00"} {"global_step": 230117, "acc_step": 0, "speed/wps": 5506.233262727062, "speed/FLOPS": 243347326755805.25, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.34 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.34, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.043793804943561554, "optim/lr": 3.151354773944215e-05, "optim/total_tokens": 1930361307136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3024743795394897, "created_at": "2025-06-03T03:37:17.688610+00:00"} {"global_step": 230118, "acc_step": 0, "speed/wps": 5527.616017955101, "speed/FLOPS": 244292335090021.72, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.41, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0415501669049263, "optim/lr": 3.1510000514347606e-05, "optim/total_tokens": 1930369695744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.298708438873291, "created_at": "2025-06-03T03:37:20.662068+00:00"} {"global_step": 230119, "acc_step": 0, "speed/wps": 5516.065377698378, "speed/FLOPS": 243781855912210.9, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.040888238698244095, "optim/lr": 3.1506453289253056e-05, "optim/total_tokens": 1930378084352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3067582845687866, "created_at": "2025-06-03T03:37:23.639572+00:00"} {"global_step": 230120, "acc_step": 0, "speed/wps": 5525.4428304664025, "speed/FLOPS": 244196291326403.2, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.48, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04092617332935333, "optim/lr": 3.150290606415873e-05, "optim/total_tokens": 1930386472960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3063068389892578, "created_at": "2025-06-03T03:37:26.609381+00:00"} {"global_step": 230121, "acc_step": 0, "speed/wps": 5519.85400476164, "speed/FLOPS": 243949293836455.84, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04558652639389038, "optim/lr": 3.149935883906419e-05, "optim/total_tokens": 1930394861568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2969279289245605, "created_at": "2025-06-03T03:37:29.581728+00:00"} {"global_step": 230122, "acc_step": 0, "speed/wps": 5522.008894522883, "speed/FLOPS": 244044528934177.12, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04098797217011452, "optim/lr": 3.149581161396964e-05, "optim/total_tokens": 1930403250176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3040851354599, "created_at": "2025-06-03T03:37:32.553521+00:00"} {"global_step": 230123, "acc_step": 0, "speed/wps": 5519.069903879819, "speed/FLOPS": 243914640590871.53, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04138336703181267, "optim/lr": 3.1492264388875094e-05, "optim/total_tokens": 1930411638784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3193986415863037, "created_at": "2025-06-03T03:37:35.525858+00:00"} {"global_step": 230124, "acc_step": 0, "speed/wps": 5522.255524601569, "speed/FLOPS": 244055428721287.88, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04192524030804634, "optim/lr": 3.148871716378077e-05, "optim/total_tokens": 1930420027392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2822051048278809, "created_at": "2025-06-03T03:37:38.496648+00:00"} {"global_step": 230125, "acc_step": 0, "speed/wps": 5517.264519375738, "speed/FLOPS": 243834851836586.72, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04178277775645256, "optim/lr": 3.148516993868622e-05, "optim/total_tokens": 1930428416000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2861472368240356, "created_at": "2025-06-03T03:37:41.471549+00:00"} {"global_step": 230126, "acc_step": 0, "speed/wps": 5534.900868824435, "speed/FLOPS": 244614288211199.38, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.11, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04330093041062355, "optim/lr": 3.1481622713591675e-05, "optim/total_tokens": 1930436804608, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.3002281188964844, "created_at": "2025-06-03T03:37:44.437339+00:00"} {"global_step": 230127, "acc_step": 0, "speed/wps": 5526.025204299889, "speed/FLOPS": 244222029268983.78, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 189.46, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04031745344400406, "optim/lr": 3.1478075488497126e-05, "optim/total_tokens": 1930445193216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3059008121490479, "created_at": "2025-06-03T03:37:47.407763+00:00"} {"global_step": 230128, "acc_step": 0, "speed/wps": 5528.12142102385, "speed/FLOPS": 244314671318773.06, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.4, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043822359293699265, "optim/lr": 3.14745282634028e-05, "optim/total_tokens": 1930453581824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.295376181602478, "created_at": "2025-06-03T03:37:50.377369+00:00"} {"global_step": 230129, "acc_step": 0, "speed/wps": 5528.071039151624, "speed/FLOPS": 244312444697898.44, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.34, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04134746268391609, "optim/lr": 3.1470981038308256e-05, "optim/total_tokens": 1930461970432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3098373413085938, "created_at": "2025-06-03T03:37:53.351067+00:00"} {"global_step": 230130, "acc_step": 0, "speed/wps": 5503.28816079324, "speed/FLOPS": 243217168324728.6, "speed/curr_iter_time": 2.9762, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9762, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.33 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.33, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.041500937193632126, "optim/lr": 3.1467433813213707e-05, "optim/total_tokens": 1930470359040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2986687421798706, "created_at": "2025-06-03T03:37:56.334995+00:00"} {"global_step": 230131, "acc_step": 0, "speed/wps": 4302.309147959953, "speed/FLOPS": 190140043125339.25, "speed/curr_iter_time": 3.8071, "speed/data_load_time": 0.0007, "speed/curr_step_time": 3.8071, "speed/est_time_elapsed": "10.14 days", "speed/est_time_remaining": "9.38 hours", "speed/est_time_elapsed_hrs": 243.37, "speed/est_time_elapsed_days": 10.14, "speed/est_time_remaining_hrs": 9.38, "speed/est_time_remaining_days": 0.39, "optim/grad_norm": 0.04007807746529579, "optim/lr": 3.146388658811938e-05, "optim/total_tokens": 1930478747648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.314003825187683, "created_at": "2025-06-03T03:38:00.151928+00:00"} {"global_step": 230132, "acc_step": 0, "speed/wps": 5521.864812301905, "speed/FLOPS": 244038161237489.56, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04172985628247261, "optim/lr": 3.146033936302484e-05, "optim/total_tokens": 1930487136256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.297372817993164, "created_at": "2025-06-03T03:38:03.128895+00:00"} {"global_step": 230133, "acc_step": 0, "speed/wps": 5530.482566310991, "speed/FLOPS": 244419021855027.53, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.31, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04160667210817337, "optim/lr": 3.145679213793029e-05, "optim/total_tokens": 1930495524864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2960478067398071, "created_at": "2025-06-03T03:38:06.098284+00:00"} {"global_step": 230134, "acc_step": 0, "speed/wps": 5542.317280115362, "speed/FLOPS": 244942055629624.16, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "7.28 hours", "speed/est_time_elapsed_hrs": 188.91, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 7.28, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04248998686671257, "optim/lr": 3.1453244912835745e-05, "optim/total_tokens": 1930503913472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.302463173866272, "created_at": "2025-06-03T03:38:09.062121+00:00"} {"global_step": 230135, "acc_step": 0, "speed/wps": 5524.367761401207, "speed/FLOPS": 244148778776423.84, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.06232188269495964, "optim/lr": 3.144969768774142e-05, "optim/total_tokens": 1930512302080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3141226768493652, "created_at": "2025-06-03T03:38:12.035145+00:00"} {"global_step": 230136, "acc_step": 0, "speed/wps": 5545.838816054223, "speed/FLOPS": 245097689493266.88, "speed/curr_iter_time": 2.9522, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9522, "speed/est_time_elapsed": "7.86 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 188.72, "speed/est_time_elapsed_days": 7.86, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04394533485174179, "optim/lr": 3.144615046264687e-05, "optim/total_tokens": 1930520690688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.318404197692871, "created_at": "2025-06-03T03:38:14.997014+00:00"} {"global_step": 230137, "acc_step": 0, "speed/wps": 5526.609457066683, "speed/FLOPS": 244247850250799.3, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.45, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04309111461043358, "optim/lr": 3.1442603237552326e-05, "optim/total_tokens": 1930529079296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2975081205368042, "created_at": "2025-06-03T03:38:17.968776+00:00"} {"global_step": 230138, "acc_step": 0, "speed/wps": 5525.9156507512635, "speed/FLOPS": 244217187562880.44, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.47, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04618038982152939, "optim/lr": 3.1439056012457776e-05, "optim/total_tokens": 1930537467904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.3024944067001343, "created_at": "2025-06-03T03:38:20.941551+00:00"} {"global_step": 230139, "acc_step": 0, "speed/wps": 5518.961371728958, "speed/FLOPS": 243909844025321.34, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045623019337654114, "optim/lr": 3.1435508787363457e-05, "optim/total_tokens": 1930545856512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3163541555404663, "created_at": "2025-06-03T03:38:23.914218+00:00"} {"global_step": 230140, "acc_step": 0, "speed/wps": 5537.313622926672, "speed/FLOPS": 244720919592923.25, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.28 hours", "speed/est_time_elapsed_hrs": 189.09, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.28, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04271767660975456, "optim/lr": 3.143196156226891e-05, "optim/total_tokens": 1930554245120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.309756875038147, "created_at": "2025-06-03T03:38:26.877879+00:00"} {"global_step": 230141, "acc_step": 0, "speed/wps": 5503.446269164071, "speed/FLOPS": 243224155905447.28, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.32 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.32, "speed/est_time_remaining_days": 0.31, "optim/grad_norm": 0.046367157250642776, "optim/lr": 3.142841433717436e-05, "optim/total_tokens": 1930562633728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3056960105895996, "created_at": "2025-06-03T03:38:29.860890+00:00"} {"global_step": 230142, "acc_step": 0, "speed/wps": 5543.017089793739, "speed/FLOPS": 244972983635457.75, "speed/curr_iter_time": 2.9549, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9549, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 188.9, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04127558693289757, "optim/lr": 3.1424867112079814e-05, "optim/total_tokens": 1930571022336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3082256317138672, "created_at": "2025-06-03T03:38:32.824826+00:00"} {"global_step": 230143, "acc_step": 0, "speed/wps": 5529.512183677451, "speed/FLOPS": 244376135909493.6, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.31, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.047427114099264145, "optim/lr": 3.142131988698549e-05, "optim/total_tokens": 1930579410944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3062883615493774, "created_at": "2025-06-03T03:38:35.795225+00:00"} {"global_step": 230144, "acc_step": 0, "speed/wps": 5535.543110520718, "speed/FLOPS": 244642672006884.1, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.28 hours", "speed/est_time_elapsed_hrs": 189.16, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.28, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.048063136637210846, "optim/lr": 3.1417772661890945e-05, "optim/total_tokens": 1930587799552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3128061294555664, "created_at": "2025-06-03T03:38:38.762088+00:00"} {"global_step": 230145, "acc_step": 0, "speed/wps": 5528.231216663185, "speed/FLOPS": 244319523724046.6, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.41, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04084945097565651, "optim/lr": 3.1414225436796395e-05, "optim/total_tokens": 1930596188160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3070807456970215, "created_at": "2025-06-03T03:38:41.732919+00:00"} {"global_step": 230146, "acc_step": 0, "speed/wps": 5526.44468347229, "speed/FLOPS": 244240568101314.88, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.41, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043610237538814545, "optim/lr": 3.1410678211701845e-05, "optim/total_tokens": 1930604576768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.313161015510559, "created_at": "2025-06-03T03:38:44.702405+00:00"} {"global_step": 230147, "acc_step": 0, "speed/wps": 5518.714436789624, "speed/FLOPS": 243898930764930.4, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04352590814232826, "optim/lr": 3.1407130986607526e-05, "optim/total_tokens": 1930612965376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3022592067718506, "created_at": "2025-06-03T03:38:47.681030+00:00"} {"global_step": 230148, "acc_step": 0, "speed/wps": 5513.668723948955, "speed/FLOPS": 243675936083672.34, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04268395155668259, "optim/lr": 3.1403583761512976e-05, "optim/total_tokens": 1930621353984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.318052053451538, "created_at": "2025-06-03T03:38:50.656938+00:00"} {"global_step": 230149, "acc_step": 0, "speed/wps": 5521.678638227388, "speed/FLOPS": 244029933296321.2, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045361585915088654, "optim/lr": 3.140003653641843e-05, "optim/total_tokens": 1930629742592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.311668038368225, "created_at": "2025-06-03T03:38:53.629070+00:00"} {"global_step": 230150, "acc_step": 0, "speed/wps": 5542.038622260959, "speed/FLOPS": 244929740378759.72, "speed/curr_iter_time": 2.9554, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9554, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 188.94, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0508534274995327, "optim/lr": 3.139648931132388e-05, "optim/total_tokens": 1930638131200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3078504800796509, "created_at": "2025-06-03T03:38:56.590184+00:00"} {"global_step": 230151, "acc_step": 0, "speed/wps": 5530.907867878215, "speed/FLOPS": 244437818007408.06, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.28 hours", "speed/est_time_elapsed_hrs": 189.32, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.28, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04147960618138313, "optim/lr": 3.139294208622956e-05, "optim/total_tokens": 1930646519808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3000026941299438, "created_at": "2025-06-03T03:38:59.561340+00:00"} {"global_step": 230152, "acc_step": 0, "speed/wps": 5530.277746331755, "speed/FLOPS": 244409969860308.97, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.28 hours", "speed/est_time_elapsed_hrs": 189.34, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.28, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05004890263080597, "optim/lr": 3.1389394861135014e-05, "optim/total_tokens": 1930654908416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.307440996170044, "created_at": "2025-06-03T03:39:02.531709+00:00"} {"global_step": 230153, "acc_step": 0, "speed/wps": 5522.745815898653, "speed/FLOPS": 244077097087080.62, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.54, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04262533411383629, "optim/lr": 3.1385847636040464e-05, "optim/total_tokens": 1930663297024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.290715217590332, "created_at": "2025-06-03T03:39:05.502951+00:00"} {"global_step": 230154, "acc_step": 0, "speed/wps": 5533.879266040207, "speed/FLOPS": 244569138597173.56, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.22, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05138757452368736, "optim/lr": 3.138230041094592e-05, "optim/total_tokens": 1930671685632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.289147973060608, "created_at": "2025-06-03T03:39:08.467627+00:00"} {"global_step": 230155, "acc_step": 0, "speed/wps": 5520.401846799056, "speed/FLOPS": 243973505650399.9, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0510016605257988, "optim/lr": 3.1378753185851595e-05, "optim/total_tokens": 1930680074240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3009519577026367, "created_at": "2025-06-03T03:39:11.440492+00:00"} {"global_step": 230156, "acc_step": 0, "speed/wps": 5509.893925723704, "speed/FLOPS": 243509109323285.1, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04889177903532982, "optim/lr": 3.1375205960757045e-05, "optim/total_tokens": 1930688462848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2886090278625488, "created_at": "2025-06-03T03:39:14.420629+00:00"} {"global_step": 230157, "acc_step": 0, "speed/wps": 5509.939529592981, "speed/FLOPS": 243511124780885.34, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.054437264800071716, "optim/lr": 3.13716587356625e-05, "optim/total_tokens": 1930696851456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.310626745223999, "created_at": "2025-06-03T03:39:17.398825+00:00"} {"global_step": 230158, "acc_step": 0, "speed/wps": 5521.537835190338, "speed/FLOPS": 244023710522778.88, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.64, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04845711961388588, "optim/lr": 3.1368111510568176e-05, "optim/total_tokens": 1930705240064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.308188557624817, "created_at": "2025-06-03T03:39:20.375037+00:00"} {"global_step": 230159, "acc_step": 0, "speed/wps": 5502.134710507466, "speed/FLOPS": 243166191725991.1, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.31 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.31, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05307746306061745, "optim/lr": 3.1364564285473626e-05, "optim/total_tokens": 1930713628672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.317201018333435, "created_at": "2025-06-03T03:39:23.357641+00:00"} {"global_step": 230160, "acc_step": 0, "speed/wps": 5530.337447850612, "speed/FLOPS": 244412608361862.38, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.35, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.053895253688097, "optim/lr": 3.1361017060379083e-05, "optim/total_tokens": 1930722017280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2961612939834595, "created_at": "2025-06-03T03:39:26.324881+00:00"} {"global_step": 230161, "acc_step": 0, "speed/wps": 5528.145387174006, "speed/FLOPS": 244315730499940.03, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.42, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.059986650943756104, "optim/lr": 3.1357469835284534e-05, "optim/total_tokens": 1930730405888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3172839879989624, "created_at": "2025-06-03T03:39:29.292756+00:00"} {"global_step": 230162, "acc_step": 0, "speed/wps": 5533.464757974949, "speed/FLOPS": 244550819462333.78, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.24, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05577462166547775, "optim/lr": 3.1353922610190214e-05, "optim/total_tokens": 1930738794496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.321455717086792, "created_at": "2025-06-03T03:39:32.258673+00:00"} {"global_step": 230163, "acc_step": 0, "speed/wps": 5513.540871708295, "speed/FLOPS": 243670285669042.25, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05907375365495682, "optim/lr": 3.1350375385095664e-05, "optim/total_tokens": 1930747183104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2925549745559692, "created_at": "2025-06-03T03:39:35.235000+00:00"} {"global_step": 230164, "acc_step": 0, "speed/wps": 5531.139673430113, "speed/FLOPS": 244448062626313.6, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.32, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0493672676384449, "optim/lr": 3.1346828160001115e-05, "optim/total_tokens": 1930755571712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2894703149795532, "created_at": "2025-06-03T03:39:38.206833+00:00"} {"global_step": 230165, "acc_step": 0, "speed/wps": 5507.713469234991, "speed/FLOPS": 243412744307072.0, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.057625118643045425, "optim/lr": 3.134328093490657e-05, "optim/total_tokens": 1930763960320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3365821838378906, "created_at": "2025-06-03T03:39:41.186513+00:00"} {"global_step": 230166, "acc_step": 0, "speed/wps": 5505.466118583605, "speed/FLOPS": 243313422911264.16, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05249553173780441, "optim/lr": 3.1339733709812245e-05, "optim/total_tokens": 1930772348928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3117214441299438, "created_at": "2025-06-03T03:39:44.171322+00:00"} {"global_step": 230167, "acc_step": 0, "speed/wps": 5527.300543102434, "speed/FLOPS": 244278392716280.53, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.46, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043446365743875504, "optim/lr": 3.13361864847177e-05, "optim/total_tokens": 1930780737536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3056060075759888, "created_at": "2025-06-03T03:39:47.141856+00:00"} {"global_step": 230168, "acc_step": 0, "speed/wps": 5538.401799045103, "speed/FLOPS": 244769011407567.6, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.08, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.06683028489351273, "optim/lr": 3.133263925962315e-05, "optim/total_tokens": 1930789126144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3156458139419556, "created_at": "2025-06-03T03:39:50.107788+00:00"} {"global_step": 230169, "acc_step": 0, "speed/wps": 5522.449793512278, "speed/FLOPS": 244064014412782.78, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.57, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04358141869306564, "optim/lr": 3.13290920345286e-05, "optim/total_tokens": 1930797514752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.32181715965271, "created_at": "2025-06-03T03:39:53.078410+00:00"} {"global_step": 230170, "acc_step": 0, "speed/wps": 5521.78274982481, "speed/FLOPS": 244034534496035.78, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.28 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.28, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.06258714199066162, "optim/lr": 3.1325544809434284e-05, "optim/total_tokens": 1930805903360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3000363111495972, "created_at": "2025-06-03T03:39:56.049622+00:00"} {"global_step": 230171, "acc_step": 0, "speed/wps": 5502.199807533416, "speed/FLOPS": 243169068681341.3, "speed/curr_iter_time": 2.9768, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9768, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04131454974412918, "optim/lr": 3.1321997584339734e-05, "optim/total_tokens": 1930814291968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.302810549736023, "created_at": "2025-06-03T03:39:59.031413+00:00"} {"global_step": 230172, "acc_step": 0, "speed/wps": 5513.056383547791, "speed/FLOPS": 243648873772183.2, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05198859050869942, "optim/lr": 3.131845035924519e-05, "optim/total_tokens": 1930822680576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3117722272872925, "created_at": "2025-06-03T03:40:02.010223+00:00"} {"global_step": 230173, "acc_step": 0, "speed/wps": 5497.8845598834205, "speed/FLOPS": 242978356822651.28, "speed/curr_iter_time": 2.9783, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9783, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 190.42, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0460357703268528, "optim/lr": 3.131490313415064e-05, "optim/total_tokens": 1930831069184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3020308017730713, "created_at": "2025-06-03T03:40:04.998138+00:00"} {"global_step": 230174, "acc_step": 0, "speed/wps": 5511.584367990203, "speed/FLOPS": 243583818218996.44, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05201955884695053, "optim/lr": 3.1311355909056315e-05, "optim/total_tokens": 1930839457792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2961044311523438, "created_at": "2025-06-03T03:40:07.978152+00:00"} {"global_step": 230175, "acc_step": 0, "speed/wps": 5508.360464953115, "speed/FLOPS": 243441338206188.8, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.29 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.29, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041941285133361816, "optim/lr": 3.130780868396177e-05, "optim/total_tokens": 1930847846400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2886632680892944, "created_at": "2025-06-03T03:40:10.960444+00:00"} {"global_step": 230176, "acc_step": 0, "speed/wps": 5526.762803098098, "speed/FLOPS": 244254627360491.72, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.31, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044336095452308655, "optim/lr": 3.130426145886722e-05, "optim/total_tokens": 1930856235008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3019402027130127, "created_at": "2025-06-03T03:40:13.932079+00:00"} {"global_step": 230177, "acc_step": 0, "speed/wps": 5533.12541617232, "speed/FLOPS": 244535822291566.38, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.26, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0442778579890728, "optim/lr": 3.130071423377268e-05, "optim/total_tokens": 1930864623616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2998396158218384, "created_at": "2025-06-03T03:40:16.897439+00:00"} {"global_step": 230178, "acc_step": 0, "speed/wps": 5517.5411949906975, "speed/FLOPS": 243847079482613.75, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04223295673727989, "optim/lr": 3.129716700867835e-05, "optim/total_tokens": 1930873012224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3072904348373413, "created_at": "2025-06-03T03:40:19.872648+00:00"} {"global_step": 230179, "acc_step": 0, "speed/wps": 5525.134607572625, "speed/FLOPS": 244182669452126.0, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043466340750455856, "optim/lr": 3.12936197835838e-05, "optim/total_tokens": 1930881400832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.302441120147705, "created_at": "2025-06-03T03:40:22.842548+00:00"} {"global_step": 230180, "acc_step": 0, "speed/wps": 5514.844808124439, "speed/FLOPS": 243727912984484.22, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.042210113257169724, "optim/lr": 3.129007255848926e-05, "optim/total_tokens": 1930889789440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3081350326538086, "created_at": "2025-06-03T03:40:25.818303+00:00"} {"global_step": 230181, "acc_step": 0, "speed/wps": 5516.107954070916, "speed/FLOPS": 243783737569951.47, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04174448177218437, "optim/lr": 3.128652533339471e-05, "optim/total_tokens": 1930898178048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.307828664779663, "created_at": "2025-06-03T03:40:28.795797+00:00"} {"global_step": 230182, "acc_step": 0, "speed/wps": 5516.596378012356, "speed/FLOPS": 243805323408182.72, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04083111137151718, "optim/lr": 3.1282978108300384e-05, "optim/total_tokens": 1930906566656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.304399013519287, "created_at": "2025-06-03T03:40:31.769356+00:00"} {"global_step": 230183, "acc_step": 0, "speed/wps": 5515.587028258463, "speed/FLOPS": 243760715315381.06, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05566108599305153, "optim/lr": 3.127943088320584e-05, "optim/total_tokens": 1930914955264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3155888319015503, "created_at": "2025-06-03T03:40:34.747743+00:00"} {"global_step": 230184, "acc_step": 0, "speed/wps": 5515.999736844569, "speed/FLOPS": 243778954922452.9, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041676245629787445, "optim/lr": 3.127588365811129e-05, "optim/total_tokens": 1930923343872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3044785261154175, "created_at": "2025-06-03T03:40:37.726844+00:00"} {"global_step": 230185, "acc_step": 0, "speed/wps": 5530.462238366954, "speed/FLOPS": 244418123463948.9, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.37, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05211256071925163, "optim/lr": 3.1272336433016965e-05, "optim/total_tokens": 1930931732480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2955021858215332, "created_at": "2025-06-03T03:40:40.696750+00:00"} {"global_step": 230186, "acc_step": 0, "speed/wps": 5511.8491291036835, "speed/FLOPS": 243595519305042.06, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041768673807382584, "optim/lr": 3.126878920792242e-05, "optim/total_tokens": 1930940121088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.31239652633667, "created_at": "2025-06-03T03:40:43.673010+00:00"} {"global_step": 230187, "acc_step": 0, "speed/wps": 5525.957896773439, "speed/FLOPS": 244219054620825.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.52, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045902106910943985, "optim/lr": 3.126524198282787e-05, "optim/total_tokens": 1930948509696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3013200759887695, "created_at": "2025-06-03T03:40:46.644769+00:00"} {"global_step": 230188, "acc_step": 0, "speed/wps": 5526.203334317397, "speed/FLOPS": 244229901704005.56, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.51, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04396051540970802, "optim/lr": 3.126169475773333e-05, "optim/total_tokens": 1930956898304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3042997121810913, "created_at": "2025-06-03T03:40:49.613355+00:00"} {"global_step": 230189, "acc_step": 0, "speed/wps": 5510.652582975607, "speed/FLOPS": 243542638090659.38, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043270573019981384, "optim/lr": 3.1258147532639e-05, "optim/total_tokens": 1930965286912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2926801443099976, "created_at": "2025-06-03T03:40:52.590458+00:00"} {"global_step": 230190, "acc_step": 0, "speed/wps": 5528.737997162752, "speed/FLOPS": 244341920828189.75, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.36, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0410647876560688, "optim/lr": 3.1254600307544453e-05, "optim/total_tokens": 1930973675520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2985203266143799, "created_at": "2025-06-03T03:40:55.557666+00:00"} {"global_step": 230191, "acc_step": 0, "speed/wps": 5519.702641670198, "speed/FLOPS": 243942604362560.66, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04481152817606926, "optim/lr": 3.125105308244991e-05, "optim/total_tokens": 1930982064128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3023676872253418, "created_at": "2025-06-03T03:40:58.532135+00:00"} {"global_step": 230192, "acc_step": 0, "speed/wps": 5522.040431277582, "speed/FLOPS": 244045922697315.06, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0412578359246254, "optim/lr": 3.124750585735536e-05, "optim/total_tokens": 1930990452736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.30000901222229, "created_at": "2025-06-03T03:41:01.506792+00:00"} {"global_step": 230193, "acc_step": 0, "speed/wps": 5534.700053322702, "speed/FLOPS": 244605413193889.7, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.17, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04262024164199829, "optim/lr": 3.124395863226104e-05, "optim/total_tokens": 1930998841344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3179832696914673, "created_at": "2025-06-03T03:41:04.471040+00:00"} {"global_step": 230194, "acc_step": 0, "speed/wps": 5530.926789280242, "speed/FLOPS": 244438654236529.12, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.35, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0432274304330349, "optim/lr": 3.124041140716649e-05, "optim/total_tokens": 1931007229952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3138408660888672, "created_at": "2025-06-03T03:41:07.440668+00:00"} {"global_step": 230195, "acc_step": 0, "speed/wps": 5520.190773992035, "speed/FLOPS": 243964177312698.16, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04555146396160126, "optim/lr": 3.123686418207194e-05, "optim/total_tokens": 1931015618560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3123373985290527, "created_at": "2025-06-03T03:41:10.414051+00:00"} {"global_step": 230196, "acc_step": 0, "speed/wps": 5526.797531687073, "speed/FLOPS": 244256162186367.4, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.44, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04184260591864586, "optim/lr": 3.12333169569774e-05, "optim/total_tokens": 1931024007168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3064936399459839, "created_at": "2025-06-03T03:41:13.383337+00:00"} {"global_step": 230197, "acc_step": 0, "speed/wps": 5514.147448031059, "speed/FLOPS": 243697093237769.38, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.93, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044759366661310196, "optim/lr": 3.122976973188307e-05, "optim/total_tokens": 1931032395776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2948408126831055, "created_at": "2025-06-03T03:41:16.361992+00:00"} {"global_step": 230198, "acc_step": 0, "speed/wps": 5505.973031885633, "speed/FLOPS": 243335825884596.28, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.27 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.27, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.042302194982767105, "optim/lr": 3.122622250678853e-05, "optim/total_tokens": 1931040784384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2981655597686768, "created_at": "2025-06-03T03:41:19.343990+00:00"} {"global_step": 230199, "acc_step": 0, "speed/wps": 5488.5268798137595, "speed/FLOPS": 242564795260520.8, "speed/curr_iter_time": 2.9842, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9842, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "7.3 hours", "speed/est_time_elapsed_hrs": 190.82, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 7.3, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040605686604976654, "optim/lr": 3.122267528169398e-05, "optim/total_tokens": 1931049172992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3074085712432861, "created_at": "2025-06-03T03:41:22.335485+00:00"} {"global_step": 230200, "acc_step": 0, "speed/wps": 5519.877585362874, "speed/FLOPS": 243950335978333.94, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0429367870092392, "optim/lr": 3.121912805659943e-05, "optim/total_tokens": 1931057561600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3099780082702637, "created_at": "2025-06-03T03:41:25.307592+00:00"} {"global_step": 230201, "acc_step": 0, "speed/wps": 5513.251711095489, "speed/FLOPS": 243657506250014.4, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041085921227931976, "optim/lr": 3.121558083150511e-05, "optim/total_tokens": 1931065950208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3023892641067505, "created_at": "2025-06-03T03:41:28.285388+00:00"} {"global_step": 230202, "acc_step": 0, "speed/wps": 5520.292684993075, "speed/FLOPS": 243968681257316.34, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04523959383368492, "optim/lr": 3.121203360641056e-05, "optim/total_tokens": 1931074338816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.321366310119629, "created_at": "2025-06-03T03:41:31.257900+00:00"} {"global_step": 230203, "acc_step": 0, "speed/wps": 5521.4823318693, "speed/FLOPS": 244021257560080.75, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.62, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04112422466278076, "optim/lr": 3.120848638131602e-05, "optim/total_tokens": 1931082727424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3057801723480225, "created_at": "2025-06-03T03:41:34.231546+00:00"} {"global_step": 230204, "acc_step": 0, "speed/wps": 5533.517579664221, "speed/FLOPS": 244553153910633.7, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.28, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04841940104961395, "optim/lr": 3.120493915622147e-05, "optim/total_tokens": 1931091116032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2956037521362305, "created_at": "2025-06-03T03:41:37.198271+00:00"} {"global_step": 230205, "acc_step": 0, "speed/wps": 5516.38376557104, "speed/FLOPS": 243795927026525.72, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043940238654613495, "optim/lr": 3.120139193112714e-05, "optim/total_tokens": 1931099504640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.297196388244629, "created_at": "2025-06-03T03:41:40.172718+00:00"} {"global_step": 230206, "acc_step": 0, "speed/wps": 5518.6700430864275, "speed/FLOPS": 243896968790476.7, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.75, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045424941927194595, "optim/lr": 3.11978447060326e-05, "optim/total_tokens": 1931107893248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3050813674926758, "created_at": "2025-06-03T03:41:43.145548+00:00"} {"global_step": 230207, "acc_step": 0, "speed/wps": 5516.367885002547, "speed/FLOPS": 243795225186682.44, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04094364494085312, "optim/lr": 3.119429748093805e-05, "optim/total_tokens": 1931116281856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3070937395095825, "created_at": "2025-06-03T03:41:46.119920+00:00"} {"global_step": 230208, "acc_step": 0, "speed/wps": 5525.488565397288, "speed/FLOPS": 244198312576255.72, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.56, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043591734021902084, "optim/lr": 3.1190750255843506e-05, "optim/total_tokens": 1931124670464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3095983266830444, "created_at": "2025-06-03T03:41:49.092718+00:00"} {"global_step": 230209, "acc_step": 0, "speed/wps": 5497.519459965156, "speed/FLOPS": 242962221275014.75, "speed/curr_iter_time": 2.9794, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9794, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.28 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.28, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040001776069402695, "optim/lr": 3.118720303074918e-05, "optim/total_tokens": 1931133059072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3077894449234009, "created_at": "2025-06-03T03:41:52.076668+00:00"} {"global_step": 230210, "acc_step": 0, "speed/wps": 5533.225777812857, "speed/FLOPS": 244540257762380.66, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.23, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04333272948861122, "optim/lr": 3.118365580565463e-05, "optim/total_tokens": 1931141447680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3085790872573853, "created_at": "2025-06-03T03:41:55.044833+00:00"} {"global_step": 230211, "acc_step": 0, "speed/wps": 5525.13101167116, "speed/FLOPS": 244182510531686.75, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.57, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04068206250667572, "optim/lr": 3.118010858056009e-05, "optim/total_tokens": 1931149836288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3056321144104004, "created_at": "2025-06-03T03:41:58.015377+00:00"} {"global_step": 230212, "acc_step": 0, "speed/wps": 5519.401820978644, "speed/FLOPS": 243929309627733.84, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04371493682265282, "optim/lr": 3.117656135546576e-05, "optim/total_tokens": 1931158224896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3047200441360474, "created_at": "2025-06-03T03:42:00.990544+00:00"} {"global_step": 230213, "acc_step": 0, "speed/wps": 5511.417765290724, "speed/FLOPS": 243576455232429.38, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04436029866337776, "optim/lr": 3.117301413037121e-05, "optim/total_tokens": 1931166613504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3134160041809082, "created_at": "2025-06-03T03:42:03.968323+00:00"} {"global_step": 230214, "acc_step": 0, "speed/wps": 5529.9483145904505, "speed/FLOPS": 244395410663527.8, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.4, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043599843978881836, "optim/lr": 3.116946690527667e-05, "optim/total_tokens": 1931175002112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3052544593811035, "created_at": "2025-06-03T03:42:06.937640+00:00"} {"global_step": 230215, "acc_step": 0, "speed/wps": 5515.861433077474, "speed/FLOPS": 243772842603850.2, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04332852363586426, "optim/lr": 3.116591968018212e-05, "optim/total_tokens": 1931183390720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.294776201248169, "created_at": "2025-06-03T03:42:09.916337+00:00"} {"global_step": 230216, "acc_step": 0, "speed/wps": 5502.798323461879, "speed/FLOPS": 243195520021897.12, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.26 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.26, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040608782321214676, "optim/lr": 3.116237245508779e-05, "optim/total_tokens": 1931191779328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.308741807937622, "created_at": "2025-06-03T03:42:12.898950+00:00"} {"global_step": 230217, "acc_step": 0, "speed/wps": 5512.978693582805, "speed/FLOPS": 243645440273384.12, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 189.93, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040670689195394516, "optim/lr": 3.115882522999325e-05, "optim/total_tokens": 1931200167936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.301981806755066, "created_at": "2025-06-03T03:42:15.877216+00:00"} {"global_step": 230218, "acc_step": 0, "speed/wps": 5529.633094027814, "speed/FLOPS": 244381479528104.38, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.42, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04199284687638283, "optim/lr": 3.11552780048987e-05, "optim/total_tokens": 1931208556544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3208080530166626, "created_at": "2025-06-03T03:42:18.846202+00:00"} {"global_step": 230219, "acc_step": 0, "speed/wps": 5514.641343565165, "speed/FLOPS": 243718920892390.34, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04463089630007744, "optim/lr": 3.1151730779804156e-05, "optim/total_tokens": 1931216945152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3088912963867188, "created_at": "2025-06-03T03:42:21.821308+00:00"} {"global_step": 230220, "acc_step": 0, "speed/wps": 5525.72733978498, "speed/FLOPS": 244208865182033.62, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.5, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04070742055773735, "optim/lr": 3.114818355470983e-05, "optim/total_tokens": 1931225333760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3037891387939453, "created_at": "2025-06-03T03:42:24.793913+00:00"} {"global_step": 230221, "acc_step": 0, "speed/wps": 5518.72587681453, "speed/FLOPS": 243899436355475.9, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041089702397584915, "optim/lr": 3.114463632961528e-05, "optim/total_tokens": 1931233722368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2937606573104858, "created_at": "2025-06-03T03:42:27.766613+00:00"} {"global_step": 230222, "acc_step": 0, "speed/wps": 5513.998622031463, "speed/FLOPS": 243690515890347.75, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04049668833613396, "optim/lr": 3.114108910452074e-05, "optim/total_tokens": 1931242110976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3069385290145874, "created_at": "2025-06-03T03:42:30.744070+00:00"} {"global_step": 230223, "acc_step": 0, "speed/wps": 5509.8768878866285, "speed/FLOPS": 243508356338093.9, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04168763384222984, "optim/lr": 3.113754187942619e-05, "optim/total_tokens": 1931250499584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3098571300506592, "created_at": "2025-06-03T03:42:33.722100+00:00"} {"global_step": 230224, "acc_step": 0, "speed/wps": 5522.7286313041195, "speed/FLOPS": 244076337615960.97, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04570673033595085, "optim/lr": 3.113399465433187e-05, "optim/total_tokens": 1931258888192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3056918382644653, "created_at": "2025-06-03T03:42:36.695748+00:00"} {"global_step": 230225, "acc_step": 0, "speed/wps": 5522.043039062398, "speed/FLOPS": 244046037948056.1, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04193625599145889, "optim/lr": 3.113044742923732e-05, "optim/total_tokens": 1931267276800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3138606548309326, "created_at": "2025-06-03T03:42:39.668310+00:00"} {"global_step": 230226, "acc_step": 0, "speed/wps": 5529.453809976846, "speed/FLOPS": 244373556090710.56, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.44, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04217884689569473, "optim/lr": 3.112690020414277e-05, "optim/total_tokens": 1931275665408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3165698051452637, "created_at": "2025-06-03T03:42:42.637283+00:00"} {"global_step": 230227, "acc_step": 0, "speed/wps": 5519.5393000951035, "speed/FLOPS": 243935385500999.44, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041105806827545166, "optim/lr": 3.1123352979048226e-05, "optim/total_tokens": 1931284054016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2982081174850464, "created_at": "2025-06-03T03:42:45.610595+00:00"} {"global_step": 230228, "acc_step": 0, "speed/wps": 5524.637817552169, "speed/FLOPS": 244160713876023.7, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041130781173706055, "optim/lr": 3.11198057539539e-05, "optim/total_tokens": 1931292442624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3194968700408936, "created_at": "2025-06-03T03:42:48.584136+00:00"} {"global_step": 230229, "acc_step": 0, "speed/wps": 5516.927590643625, "speed/FLOPS": 243819961311184.9, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04173498600721359, "optim/lr": 3.1116258528859356e-05, "optim/total_tokens": 1931300831232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3141838312149048, "created_at": "2025-06-03T03:42:51.561935+00:00"} {"global_step": 230230, "acc_step": 0, "speed/wps": 5524.803213876446, "speed/FLOPS": 244168023546981.6, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.54, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04420285299420357, "optim/lr": 3.111271130376481e-05, "optim/total_tokens": 1931309219840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3099602460861206, "created_at": "2025-06-03T03:42:54.531320+00:00"} {"global_step": 230231, "acc_step": 0, "speed/wps": 5509.745572116246, "speed/FLOPS": 243502552853178.03, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.052051980048418045, "optim/lr": 3.110916407867026e-05, "optim/total_tokens": 1931317608448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3075172901153564, "created_at": "2025-06-03T03:42:57.512420+00:00"} {"global_step": 230232, "acc_step": 0, "speed/wps": 5504.353475679368, "speed/FLOPS": 243264249789919.53, "speed/curr_iter_time": 2.9757, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9757, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.25 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.25, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04073469340801239, "optim/lr": 3.110561685357594e-05, "optim/total_tokens": 1931325997056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2962713241577148, "created_at": "2025-06-03T03:43:00.495975+00:00"} {"global_step": 230233, "acc_step": 0, "speed/wps": 5509.971410555958, "speed/FLOPS": 243512533756267.38, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04646112024784088, "optim/lr": 3.110206962848139e-05, "optim/total_tokens": 1931334385664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2927265167236328, "created_at": "2025-06-03T03:43:03.473606+00:00"} {"global_step": 230234, "acc_step": 0, "speed/wps": 5520.7610465852395, "speed/FLOPS": 243989380442398.03, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04200968146324158, "optim/lr": 3.1098522403386845e-05, "optim/total_tokens": 1931342774272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3152047395706177, "created_at": "2025-06-03T03:43:06.449377+00:00"} {"global_step": 230235, "acc_step": 0, "speed/wps": 5522.453814552677, "speed/FLOPS": 244064192122186.88, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04464920610189438, "optim/lr": 3.1094975178292295e-05, "optim/total_tokens": 1931351162880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3047860860824585, "created_at": "2025-06-03T03:43:09.419928+00:00"} {"global_step": 230236, "acc_step": 0, "speed/wps": 5520.944088990706, "speed/FLOPS": 243997469979823.72, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04124709963798523, "optim/lr": 3.109142795319797e-05, "optim/total_tokens": 1931359551488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3004682064056396, "created_at": "2025-06-03T03:43:12.393458+00:00"} {"global_step": 230237, "acc_step": 0, "speed/wps": 5514.220801931205, "speed/FLOPS": 243700335104696.5, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04524604603648186, "optim/lr": 3.1087880728103426e-05, "optim/total_tokens": 1931367940096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2961007356643677, "created_at": "2025-06-03T03:43:15.368930+00:00"} {"global_step": 230238, "acc_step": 0, "speed/wps": 5509.7633783378515, "speed/FLOPS": 243503339797032.5, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.039956506341695786, "optim/lr": 3.1084333503008876e-05, "optim/total_tokens": 1931376328704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.297890067100525, "created_at": "2025-06-03T03:43:18.349366+00:00"} {"global_step": 230239, "acc_step": 0, "speed/wps": 5517.092596565322, "speed/FLOPS": 243827253728347.06, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04121386259794235, "optim/lr": 3.108078627791455e-05, "optim/total_tokens": 1931384717312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3154608011245728, "created_at": "2025-06-03T03:43:21.322895+00:00"} {"global_step": 230240, "acc_step": 0, "speed/wps": 5513.057757923121, "speed/FLOPS": 243648934512538.1, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04168671742081642, "optim/lr": 3.107723905282001e-05, "optim/total_tokens": 1931393105920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3091528415679932, "created_at": "2025-06-03T03:43:24.300103+00:00"} {"global_step": 230241, "acc_step": 0, "speed/wps": 5509.231128353772, "speed/FLOPS": 243479817072038.56, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043490730226039886, "optim/lr": 3.107369182772546e-05, "optim/total_tokens": 1931401494528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2889318466186523, "created_at": "2025-06-03T03:43:27.283031+00:00"} {"global_step": 230242, "acc_step": 0, "speed/wps": 5506.5402834932775, "speed/FLOPS": 243360895502197.25, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 190.23, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043303459882736206, "optim/lr": 3.1070144602630914e-05, "optim/total_tokens": 1931409883136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2890865802764893, "created_at": "2025-06-03T03:43:30.265098+00:00"} {"global_step": 230243, "acc_step": 0, "speed/wps": 5514.188743873673, "speed/FLOPS": 243698918302641.62, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04326915740966797, "optim/lr": 3.106659737753659e-05, "optim/total_tokens": 1931418271744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3038012981414795, "created_at": "2025-06-03T03:43:33.244440+00:00"} {"global_step": 230244, "acc_step": 0, "speed/wps": 5508.108565823024, "speed/FLOPS": 243430205553975.4, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04755699262022972, "optim/lr": 3.106305015244204e-05, "optim/total_tokens": 1931426660352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3036959171295166, "created_at": "2025-06-03T03:43:36.226231+00:00"} {"global_step": 230245, "acc_step": 0, "speed/wps": 5511.41702023699, "speed/FLOPS": 243576422304867.88, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04478002339601517, "optim/lr": 3.1059502927347495e-05, "optim/total_tokens": 1931435048960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.307447075843811, "created_at": "2025-06-03T03:43:39.202611+00:00"} {"global_step": 230246, "acc_step": 0, "speed/wps": 5513.150887053714, "speed/FLOPS": 243653050343432.2, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0411568246781826, "optim/lr": 3.1055955702252945e-05, "optim/total_tokens": 1931443437568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3109080791473389, "created_at": "2025-06-03T03:43:42.183098+00:00"} {"global_step": 230247, "acc_step": 0, "speed/wps": 5510.669323526819, "speed/FLOPS": 243543377937337.03, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04267682135105133, "optim/lr": 3.105240847715862e-05, "optim/total_tokens": 1931451826176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3041331768035889, "created_at": "2025-06-03T03:43:45.160905+00:00"} {"global_step": 230248, "acc_step": 0, "speed/wps": 5518.999321028305, "speed/FLOPS": 243911521190110.34, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04172328859567642, "optim/lr": 3.1048861252064076e-05, "optim/total_tokens": 1931460214784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3017971515655518, "created_at": "2025-06-03T03:43:48.138606+00:00"} {"global_step": 230249, "acc_step": 0, "speed/wps": 5518.502813106305, "speed/FLOPS": 243889578081315.9, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041443031281232834, "optim/lr": 3.1045314026969526e-05, "optim/total_tokens": 1931468603392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.306070327758789, "created_at": "2025-06-03T03:43:51.116489+00:00"} {"global_step": 230250, "acc_step": 0, "speed/wps": 5512.837241213123, "speed/FLOPS": 243639188802663.03, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044121190905570984, "optim/lr": 3.104176680187498e-05, "optim/total_tokens": 1931476992000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3040828704833984, "created_at": "2025-06-03T03:43:54.092493+00:00"} {"global_step": 230251, "acc_step": 0, "speed/wps": 5499.822549022259, "speed/FLOPS": 243064006023060.3, "speed/curr_iter_time": 2.9781, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9781, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.24 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.24, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04150257632136345, "optim/lr": 3.103821957678066e-05, "optim/total_tokens": 1931485380608, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.325186848640442, "created_at": "2025-06-03T03:43:57.075721+00:00"} {"global_step": 230252, "acc_step": 0, "speed/wps": 5507.721737888129, "speed/FLOPS": 243413109739217.9, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.23 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.23, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04133295267820358, "optim/lr": 3.103467235168611e-05, "optim/total_tokens": 1931493769216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.314628005027771, "created_at": "2025-06-03T03:44:00.054762+00:00"} {"global_step": 230253, "acc_step": 0, "speed/wps": 5512.460174017748, "speed/FLOPS": 243622524362632.3, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04182300344109535, "optim/lr": 3.1031125126591564e-05, "optim/total_tokens": 1931502157824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2926779985427856, "created_at": "2025-06-03T03:44:03.032117+00:00"} {"global_step": 230254, "acc_step": 0, "speed/wps": 5513.971305875424, "speed/FLOPS": 243689308656067.6, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 189.93, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.042521167546510696, "optim/lr": 3.1027577901497015e-05, "optim/total_tokens": 1931510546432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.291935682296753, "created_at": "2025-06-03T03:44:06.011597+00:00"} {"global_step": 230255, "acc_step": 0, "speed/wps": 5531.737650277711, "speed/FLOPS": 244474490142254.4, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.38, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04538380727171898, "optim/lr": 3.1024030676402695e-05, "optim/total_tokens": 1931518935040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.293579339981079, "created_at": "2025-06-03T03:44:08.978288+00:00"} {"global_step": 230256, "acc_step": 0, "speed/wps": 5535.748890759575, "speed/FLOPS": 244651766440162.84, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.24, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04101593419909477, "optim/lr": 3.1020483451308145e-05, "optim/total_tokens": 1931527323648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2996729612350464, "created_at": "2025-06-03T03:44:11.942818+00:00"} {"global_step": 230257, "acc_step": 0, "speed/wps": 5505.667232264663, "speed/FLOPS": 243322311106573.78, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.22 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.22, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04038156569004059, "optim/lr": 3.1016936226213596e-05, "optim/total_tokens": 1931535712256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.3061316013336182, "created_at": "2025-06-03T03:44:14.923210+00:00"} {"global_step": 230258, "acc_step": 0, "speed/wps": 5515.077786523665, "speed/FLOPS": 243738209437238.47, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04096410423517227, "optim/lr": 3.101338900111905e-05, "optim/total_tokens": 1931544100864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3067362308502197, "created_at": "2025-06-03T03:44:17.902281+00:00"} {"global_step": 230259, "acc_step": 0, "speed/wps": 5513.980619918846, "speed/FLOPS": 243689720289113.25, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04152334854006767, "optim/lr": 3.1009841776024726e-05, "optim/total_tokens": 1931552489472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3055338859558105, "created_at": "2025-06-03T03:44:20.880566+00:00"} {"global_step": 230260, "acc_step": 0, "speed/wps": 5530.430644462487, "speed/FLOPS": 244416727175083.75, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.36, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04319024831056595, "optim/lr": 3.1006294550930183e-05, "optim/total_tokens": 1931560878080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3014501333236694, "created_at": "2025-06-03T03:44:23.847073+00:00"} {"global_step": 230261, "acc_step": 0, "speed/wps": 5530.618073818739, "speed/FLOPS": 244425010593279.66, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.42, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041715145111083984, "optim/lr": 3.1002747325835634e-05, "optim/total_tokens": 1931569266688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.3092950582504272, "created_at": "2025-06-03T03:44:26.814313+00:00"} {"global_step": 230262, "acc_step": 0, "speed/wps": 5526.387759454746, "speed/FLOPS": 244238052351102.94, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.57, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0440547838807106, "optim/lr": 3.099920010074109e-05, "optim/total_tokens": 1931577655296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2976527214050293, "created_at": "2025-06-03T03:44:29.787802+00:00"} {"global_step": 230263, "acc_step": 0, "speed/wps": 5519.6740822283555, "speed/FLOPS": 243941342181411.7, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04253876209259033, "optim/lr": 3.0995652875646765e-05, "optim/total_tokens": 1931586043904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3110129833221436, "created_at": "2025-06-03T03:44:32.763448+00:00"} {"global_step": 230264, "acc_step": 0, "speed/wps": 5523.061351465924, "speed/FLOPS": 244091042144096.6, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04588254541158676, "optim/lr": 3.0992105650552215e-05, "optim/total_tokens": 1931594432512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2982428073883057, "created_at": "2025-06-03T03:44:35.737568+00:00"} {"global_step": 230265, "acc_step": 0, "speed/wps": 5512.933327038663, "speed/FLOPS": 243643435304340.06, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04586005210876465, "optim/lr": 3.098855842545767e-05, "optim/total_tokens": 1931602821120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3115545511245728, "created_at": "2025-06-03T03:44:38.713949+00:00"} {"global_step": 230266, "acc_step": 0, "speed/wps": 5516.158320486072, "speed/FLOPS": 243785963507702.66, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04176095128059387, "optim/lr": 3.0985011200363346e-05, "optim/total_tokens": 1931611209728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3096519708633423, "created_at": "2025-06-03T03:44:41.690341+00:00"} {"global_step": 230267, "acc_step": 0, "speed/wps": 5507.231131713763, "speed/FLOPS": 243391427457460.97, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04420856386423111, "optim/lr": 3.0981463975268796e-05, "optim/total_tokens": 1931619598336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3259044885635376, "created_at": "2025-06-03T03:44:44.670357+00:00"} {"global_step": 230268, "acc_step": 0, "speed/wps": 5519.964644384098, "speed/FLOPS": 243954183541463.6, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04266761988401413, "optim/lr": 3.097791675017425e-05, "optim/total_tokens": 1931627986944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2946381568908691, "created_at": "2025-06-03T03:44:47.642478+00:00"} {"global_step": 230269, "acc_step": 0, "speed/wps": 5505.562612273795, "speed/FLOPS": 243317687438471.06, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045947782695293427, "optim/lr": 3.09743695250797e-05, "optim/total_tokens": 1931636375552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2950718402862549, "created_at": "2025-06-03T03:44:50.622611+00:00"} {"global_step": 230270, "acc_step": 0, "speed/wps": 5529.715341776231, "speed/FLOPS": 244385114457602.28, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.4, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04116514325141907, "optim/lr": 3.097082229998538e-05, "optim/total_tokens": 1931644764160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.315346121788025, "created_at": "2025-06-03T03:44:53.591894+00:00"} {"global_step": 230271, "acc_step": 0, "speed/wps": 5518.978000914114, "speed/FLOPS": 243910578950189.38, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0485319159924984, "optim/lr": 3.0967275074890834e-05, "optim/total_tokens": 1931653152768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3096429109573364, "created_at": "2025-06-03T03:44:56.565996+00:00"} {"global_step": 230272, "acc_step": 0, "speed/wps": 5521.705934180053, "speed/FLOPS": 244031139637715.66, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.047096431255340576, "optim/lr": 3.0963727849796284e-05, "optim/total_tokens": 1931661541376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.291374683380127, "created_at": "2025-06-03T03:44:59.537101+00:00"} {"global_step": 230273, "acc_step": 0, "speed/wps": 5521.611512796188, "speed/FLOPS": 244026966695841.28, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04196930304169655, "optim/lr": 3.096018062470174e-05, "optim/total_tokens": 1931669929984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.308152675628662, "created_at": "2025-06-03T03:45:02.510873+00:00"} {"global_step": 230274, "acc_step": 0, "speed/wps": 5509.850255799508, "speed/FLOPS": 243507179336158.56, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04471565783023834, "optim/lr": 3.0956633399607415e-05, "optim/total_tokens": 1931678318592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.298770546913147, "created_at": "2025-06-03T03:45:05.490898+00:00"} {"global_step": 230275, "acc_step": 0, "speed/wps": 5508.318648827908, "speed/FLOPS": 243439490147488.97, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04048803448677063, "optim/lr": 3.0953086174512865e-05, "optim/total_tokens": 1931686707200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2974213361740112, "created_at": "2025-06-03T03:45:08.473099+00:00"} {"global_step": 230276, "acc_step": 0, "speed/wps": 5516.778238257493, "speed/FLOPS": 243813360700172.7, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04476097598671913, "optim/lr": 3.094953894941832e-05, "optim/total_tokens": 1931695095808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2870253324508667, "created_at": "2025-06-03T03:45:11.451430+00:00"} {"global_step": 230277, "acc_step": 0, "speed/wps": 5524.609596944298, "speed/FLOPS": 244159466669601.94, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041784681379795074, "optim/lr": 3.094599172432377e-05, "optim/total_tokens": 1931703484416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3232299089431763, "created_at": "2025-06-03T03:45:14.423364+00:00"} {"global_step": 230278, "acc_step": 0, "speed/wps": 5516.621251583982, "speed/FLOPS": 243806422692734.12, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045661184936761856, "optim/lr": 3.094244449922945e-05, "optim/total_tokens": 1931711873024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3122855424880981, "created_at": "2025-06-03T03:45:17.400691+00:00"} {"global_step": 230279, "acc_step": 0, "speed/wps": 5523.365665803997, "speed/FLOPS": 244104491280217.44, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04394229128956795, "optim/lr": 3.09388972741349e-05, "optim/total_tokens": 1931720261632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3223720788955688, "created_at": "2025-06-03T03:45:20.376728+00:00"} {"global_step": 230280, "acc_step": 0, "speed/wps": 5510.533458800367, "speed/FLOPS": 243537373411846.56, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04154385253787041, "optim/lr": 3.093535004904035e-05, "optim/total_tokens": 1931728650240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2878570556640625, "created_at": "2025-06-03T03:45:23.357053+00:00"} {"global_step": 230281, "acc_step": 0, "speed/wps": 5519.622551028064, "speed/FLOPS": 243939064766119.4, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041385501623153687, "optim/lr": 3.093180282394581e-05, "optim/total_tokens": 1931737038848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3078687191009521, "created_at": "2025-06-03T03:45:26.330159+00:00"} {"global_step": 230282, "acc_step": 0, "speed/wps": 5523.1160676565, "speed/FLOPS": 244093460319657.16, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04089725390076637, "optim/lr": 3.0928255598851484e-05, "optim/total_tokens": 1931745427456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.3120561838150024, "created_at": "2025-06-03T03:45:29.305814+00:00"} {"global_step": 230283, "acc_step": 0, "speed/wps": 5509.71374984839, "speed/FLOPS": 243501146471819.94, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04174397513270378, "optim/lr": 3.092470837375694e-05, "optim/total_tokens": 1931753816064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3167179822921753, "created_at": "2025-06-03T03:45:32.288475+00:00"} {"global_step": 230284, "acc_step": 0, "speed/wps": 5503.890905866486, "speed/FLOPS": 243243806571837.06, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045842476189136505, "optim/lr": 3.092116114866239e-05, "optim/total_tokens": 1931762204672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2867571115493774, "created_at": "2025-06-03T03:45:35.269180+00:00"} {"global_step": 230285, "acc_step": 0, "speed/wps": 5526.093091509836, "speed/FLOPS": 244225029536185.22, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040754206478595734, "optim/lr": 3.091761392356784e-05, "optim/total_tokens": 1931770593280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3071786165237427, "created_at": "2025-06-03T03:45:38.237898+00:00"} {"global_step": 230286, "acc_step": 0, "speed/wps": 5528.783192848811, "speed/FLOPS": 244343918246181.06, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 189.5, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04596283659338951, "optim/lr": 3.091406669847352e-05, "optim/total_tokens": 1931778981888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3149089813232422, "created_at": "2025-06-03T03:45:41.207320+00:00"} {"global_step": 230287, "acc_step": 0, "speed/wps": 5520.625303567703, "speed/FLOPS": 243983381295818.66, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04109586030244827, "optim/lr": 3.091051947337897e-05, "optim/total_tokens": 1931787370496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2996577024459839, "created_at": "2025-06-03T03:45:44.185037+00:00"} {"global_step": 230288, "acc_step": 0, "speed/wps": 5521.929197118522, "speed/FLOPS": 244041006716832.7, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04285937547683716, "optim/lr": 3.090697224828443e-05, "optim/total_tokens": 1931795759104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3042089939117432, "created_at": "2025-06-03T03:45:47.159712+00:00"} {"global_step": 230289, "acc_step": 0, "speed/wps": 5515.721407752065, "speed/FLOPS": 243766654201181.66, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04321007803082466, "optim/lr": 3.090342502318988e-05, "optim/total_tokens": 1931804147712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.300632119178772, "created_at": "2025-06-03T03:45:50.137272+00:00"} {"global_step": 230290, "acc_step": 0, "speed/wps": 5514.473620846921, "speed/FLOPS": 243711508406726.66, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04224545136094093, "optim/lr": 3.0899877798095553e-05, "optim/total_tokens": 1931812536320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2980976104736328, "created_at": "2025-06-03T03:45:53.113779+00:00"} {"global_step": 230291, "acc_step": 0, "speed/wps": 5502.124318753416, "speed/FLOPS": 243165732463651.94, "speed/curr_iter_time": 2.976, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.976, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04223978891968727, "optim/lr": 3.089633057300101e-05, "optim/total_tokens": 1931820924928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3152763843536377, "created_at": "2025-06-03T03:45:56.096152+00:00"} {"global_step": 230292, "acc_step": 0, "speed/wps": 5498.66097137398, "speed/FLOPS": 243012670236499.72, "speed/curr_iter_time": 2.9787, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9787, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.21 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.21, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041347406804561615, "optim/lr": 3.089278334790646e-05, "optim/total_tokens": 1931829313536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2964242696762085, "created_at": "2025-06-03T03:45:59.083834+00:00"} {"global_step": 230293, "acc_step": 0, "speed/wps": 5516.19781907076, "speed/FLOPS": 243787709142973.78, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04090866819024086, "optim/lr": 3.0889236122812135e-05, "optim/total_tokens": 1931837702144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3088202476501465, "created_at": "2025-06-03T03:46:02.058598+00:00"} {"global_step": 230294, "acc_step": 0, "speed/wps": 5514.199456065552, "speed/FLOPS": 243699391726692.72, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04435558617115021, "optim/lr": 3.088568889771759e-05, "optim/total_tokens": 1931846090752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3038723468780518, "created_at": "2025-06-03T03:46:05.036762+00:00"} {"global_step": 230295, "acc_step": 0, "speed/wps": 5524.61336349222, "speed/FLOPS": 244159633131741.16, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04320415481925011, "optim/lr": 3.088214167262304e-05, "optim/total_tokens": 1931854479360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3144093751907349, "created_at": "2025-06-03T03:46:08.012356+00:00"} {"global_step": 230296, "acc_step": 0, "speed/wps": 5514.478318686606, "speed/FLOPS": 243711716027195.0, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.042036812752485275, "optim/lr": 3.08785944475285e-05, "optim/total_tokens": 1931862867968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3170675039291382, "created_at": "2025-06-03T03:46:10.990167+00:00"} {"global_step": 230297, "acc_step": 0, "speed/wps": 5517.870025409235, "speed/FLOPS": 243861612104006.44, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04159625992178917, "optim/lr": 3.087504722243417e-05, "optim/total_tokens": 1931871256576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2965892553329468, "created_at": "2025-06-03T03:46:13.965164+00:00"} {"global_step": 230298, "acc_step": 0, "speed/wps": 5526.415174466585, "speed/FLOPS": 244239263954303.5, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04073767736554146, "optim/lr": 3.087149999733962e-05, "optim/total_tokens": 1931879645184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.3045868873596191, "created_at": "2025-06-03T03:46:16.935880+00:00"} {"global_step": 230299, "acc_step": 0, "speed/wps": 5499.637662302529, "speed/FLOPS": 243055834976384.25, "speed/curr_iter_time": 2.9782, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9782, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.2 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.2, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04095965623855591, "optim/lr": 3.086795277224508e-05, "optim/total_tokens": 1931888033792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2945752143859863, "created_at": "2025-06-03T03:46:19.922640+00:00"} {"global_step": 230300, "acc_step": 0, "speed/wps": 5506.804334826418, "speed/FLOPS": 243372565219584.84, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04113159328699112, "optim/lr": 3.086440554715053e-05, "optim/total_tokens": 1931896422400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3012257814407349, "created_at": "2025-06-03T03:46:22.901754+00:00"} {"global_step": 230301, "acc_step": 0, "speed/wps": 5507.467599261977, "speed/FLOPS": 243401878112741.38, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04198739305138588, "optim/lr": 3.0860858322056204e-05, "optim/total_tokens": 1931904811008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3153386116027832, "created_at": "2025-06-03T03:46:25.880434+00:00"} {"global_step": 230302, "acc_step": 0, "speed/wps": 5528.30121933837, "speed/FLOPS": 244322617483983.62, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.54, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044400643557310104, "optim/lr": 3.085731109696166e-05, "optim/total_tokens": 1931913199616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2945643663406372, "created_at": "2025-06-03T03:46:28.847939+00:00"} {"global_step": 230303, "acc_step": 0, "speed/wps": 5524.797347220231, "speed/FLOPS": 244167764270805.2, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04387207701802254, "optim/lr": 3.085376387186711e-05, "optim/total_tokens": 1931921588224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.292600154876709, "created_at": "2025-06-03T03:46:31.818540+00:00"} {"global_step": 230304, "acc_step": 0, "speed/wps": 5511.0313032687545, "speed/FLOPS": 243559375589150.28, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04417960345745087, "optim/lr": 3.085021664677257e-05, "optim/total_tokens": 1931929976832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3003767728805542, "created_at": "2025-06-03T03:46:34.796396+00:00"} {"global_step": 230305, "acc_step": 0, "speed/wps": 5502.903624637911, "speed/FLOPS": 243200173794897.5, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0412859208881855, "optim/lr": 3.084666942167824e-05, "optim/total_tokens": 1931938365440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3163081407546997, "created_at": "2025-06-03T03:46:37.780853+00:00"} {"global_step": 230306, "acc_step": 0, "speed/wps": 5516.789835041648, "speed/FLOPS": 243813873218674.62, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04764816164970398, "optim/lr": 3.084312219658369e-05, "optim/total_tokens": 1931946754048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3142342567443848, "created_at": "2025-06-03T03:46:40.758800+00:00"} {"global_step": 230307, "acc_step": 0, "speed/wps": 5503.37808718296, "speed/FLOPS": 243221142610869.22, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.18 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.18, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04542139545083046, "optim/lr": 3.083957497148915e-05, "optim/total_tokens": 1931955142656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3109257221221924, "created_at": "2025-06-03T03:46:43.744255+00:00"} {"global_step": 230308, "acc_step": 0, "speed/wps": 5517.616105849632, "speed/FLOPS": 243850390159150.12, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04235682263970375, "optim/lr": 3.08360277463946e-05, "optim/total_tokens": 1931963531264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3024704456329346, "created_at": "2025-06-03T03:46:46.719532+00:00"} {"global_step": 230309, "acc_step": 0, "speed/wps": 5500.342316334252, "speed/FLOPS": 243086977077840.12, "speed/curr_iter_time": 2.9778, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9778, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.19 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.19, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04747159034013748, "optim/lr": 3.083248052130028e-05, "optim/total_tokens": 1931971919872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2949897050857544, "created_at": "2025-06-03T03:46:49.704960+00:00"} {"global_step": 230310, "acc_step": 0, "speed/wps": 5511.758612238264, "speed/FLOPS": 243591518922897.8, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04067159816622734, "optim/lr": 3.082893329620573e-05, "optim/total_tokens": 1931980308480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3008522987365723, "created_at": "2025-06-03T03:46:52.681704+00:00"} {"global_step": 230311, "acc_step": 0, "speed/wps": 5525.256193356395, "speed/FLOPS": 244188042921436.2, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.15 hours", "speed/est_time_elapsed_hrs": 189.58, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.15, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044283512979745865, "optim/lr": 3.082538607111118e-05, "optim/total_tokens": 1931988697088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.297363519668579, "created_at": "2025-06-03T03:46:55.654643+00:00"} {"global_step": 230312, "acc_step": 0, "speed/wps": 5520.23166413074, "speed/FLOPS": 243965984447534.2, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.046183545142412186, "optim/lr": 3.082183884601664e-05, "optim/total_tokens": 1931997085696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3026957511901855, "created_at": "2025-06-03T03:46:58.629030+00:00"} {"global_step": 230313, "acc_step": 0, "speed/wps": 5514.788080464258, "speed/FLOPS": 243725405912262.72, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041846856474876404, "optim/lr": 3.081829162092231e-05, "optim/total_tokens": 1932005474304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3133714199066162, "created_at": "2025-06-03T03:47:01.605448+00:00"} {"global_step": 230314, "acc_step": 0, "speed/wps": 5519.711719636638, "speed/FLOPS": 243943005562212.06, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.048960719257593155, "optim/lr": 3.081474439582777e-05, "optim/total_tokens": 1932013862912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2809687852859497, "created_at": "2025-06-03T03:47:04.577464+00:00"} {"global_step": 230315, "acc_step": 0, "speed/wps": 5516.902956090744, "speed/FLOPS": 243818872590038.62, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05023619532585144, "optim/lr": 3.081119717073322e-05, "optim/total_tokens": 1932022251520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2960102558135986, "created_at": "2025-06-03T03:47:07.554615+00:00"} {"global_step": 230316, "acc_step": 0, "speed/wps": 5527.202915608983, "speed/FLOPS": 244274078080772.8, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.15 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.15, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0411539226770401, "optim/lr": 3.080764994563867e-05, "optim/total_tokens": 1932030640128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2907088994979858, "created_at": "2025-06-03T03:47:10.526239+00:00"} {"global_step": 230317, "acc_step": 0, "speed/wps": 5514.566411469265, "speed/FLOPS": 243715609277288.8, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0467408262193203, "optim/lr": 3.080410272054435e-05, "optim/total_tokens": 1932039028736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3156360387802124, "created_at": "2025-06-03T03:47:13.504098+00:00"} {"global_step": 230318, "acc_step": 0, "speed/wps": 5520.411403447966, "speed/FLOPS": 243973928005366.38, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04164294898509979, "optim/lr": 3.08005554954498e-05, "optim/total_tokens": 1932047417344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2974191904067993, "created_at": "2025-06-03T03:47:16.478982+00:00"} {"global_step": 230319, "acc_step": 0, "speed/wps": 5526.55806452618, "speed/FLOPS": 244245578963559.97, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.15 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.15, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04159469157457352, "optim/lr": 3.0797008270355256e-05, "optim/total_tokens": 1932055805952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3077508211135864, "created_at": "2025-06-03T03:47:19.451882+00:00"} {"global_step": 230320, "acc_step": 0, "speed/wps": 5516.758766945724, "speed/FLOPS": 243812500167855.72, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0415782667696476, "optim/lr": 3.079346104526093e-05, "optim/total_tokens": 1932064194560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.321053385734558, "created_at": "2025-06-03T03:47:22.426082+00:00"} {"global_step": 230321, "acc_step": 0, "speed/wps": 5536.898575831663, "speed/FLOPS": 244702576635727.47, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.18, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04027298092842102, "optim/lr": 3.078991382016638e-05, "optim/total_tokens": 1932072583168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3101370334625244, "created_at": "2025-06-03T03:47:25.389022+00:00"} {"global_step": 230322, "acc_step": 0, "speed/wps": 5519.954982763107, "speed/FLOPS": 243953756547268.44, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.15 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.15, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04232734814286232, "optim/lr": 3.078636659507184e-05, "optim/total_tokens": 1932080971776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2951170206069946, "created_at": "2025-06-03T03:47:28.360707+00:00"} {"global_step": 230323, "acc_step": 0, "speed/wps": 5513.201301421279, "speed/FLOPS": 243655278400434.44, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04259764403104782, "optim/lr": 3.078281936997729e-05, "optim/total_tokens": 1932089360384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3056477308273315, "created_at": "2025-06-03T03:47:31.336327+00:00"} {"global_step": 230324, "acc_step": 0, "speed/wps": 5520.4482566419865, "speed/FLOPS": 243975556727910.3, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.15 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.15, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04267886281013489, "optim/lr": 3.077927214488296e-05, "optim/total_tokens": 1932097748992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2995326519012451, "created_at": "2025-06-03T03:47:34.311821+00:00"} {"global_step": 230325, "acc_step": 0, "speed/wps": 5508.346881326138, "speed/FLOPS": 243440737879403.72, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.17 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.17, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0432429239153862, "optim/lr": 3.077572491978842e-05, "optim/total_tokens": 1932106137600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3054544925689697, "created_at": "2025-06-03T03:47:37.291170+00:00"} {"global_step": 230326, "acc_step": 0, "speed/wps": 5512.189872239203, "speed/FLOPS": 243610578407550.56, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04071487486362457, "optim/lr": 3.077217769469387e-05, "optim/total_tokens": 1932114526208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3189713954925537, "created_at": "2025-06-03T03:47:40.268491+00:00"} {"global_step": 230327, "acc_step": 0, "speed/wps": 5525.7781835918595, "speed/FLOPS": 244211112218055.5, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04236391559243202, "optim/lr": 3.0768630469599326e-05, "optim/total_tokens": 1932122914816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2928788661956787, "created_at": "2025-06-03T03:47:43.239252+00:00"} {"global_step": 230328, "acc_step": 0, "speed/wps": 5522.923441963262, "speed/FLOPS": 244084947249963.75, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04108770936727524, "optim/lr": 3.0765083244505e-05, "optim/total_tokens": 1932131303424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3033610582351685, "created_at": "2025-06-03T03:47:46.213536+00:00"} {"global_step": 230329, "acc_step": 0, "speed/wps": 5521.251094626708, "speed/FLOPS": 244011038057537.72, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.15 hours", "speed/est_time_elapsed_hrs": 189.8, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.15, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04097438603639603, "optim/lr": 3.076153601941045e-05, "optim/total_tokens": 1932139692032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3030728101730347, "created_at": "2025-06-03T03:47:49.184437+00:00"} {"global_step": 230330, "acc_step": 0, "speed/wps": 5525.452656653016, "speed/FLOPS": 244196725593556.5, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041186828166246414, "optim/lr": 3.075798879431591e-05, "optim/total_tokens": 1932148080640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3052685260772705, "created_at": "2025-06-03T03:47:52.154157+00:00"} {"global_step": 230331, "acc_step": 0, "speed/wps": 5528.199097988578, "speed/FLOPS": 244318104243027.25, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.51, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04202628880739212, "optim/lr": 3.075444156922136e-05, "optim/total_tokens": 1932156469248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.309544563293457, "created_at": "2025-06-03T03:47:55.124393+00:00"} {"global_step": 230332, "acc_step": 0, "speed/wps": 5527.346030926977, "speed/FLOPS": 244280403045297.53, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.59, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040234096348285675, "optim/lr": 3.075089434412703e-05, "optim/total_tokens": 1932164857856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2971135377883911, "created_at": "2025-06-03T03:47:58.092311+00:00"} {"global_step": 230333, "acc_step": 0, "speed/wps": 5520.374911492649, "speed/FLOPS": 243972315247724.1, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045756611973047256, "optim/lr": 3.074734711903249e-05, "optim/total_tokens": 1932173246464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3067290782928467, "created_at": "2025-06-03T03:48:01.064167+00:00"} {"global_step": 230334, "acc_step": 0, "speed/wps": 5525.276748122785, "speed/FLOPS": 244188951336901.78, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04287489131093025, "optim/lr": 3.074379989393794e-05, "optim/total_tokens": 1932181635072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3131115436553955, "created_at": "2025-06-03T03:48:04.036565+00:00"} {"global_step": 230335, "acc_step": 0, "speed/wps": 5519.02869635101, "speed/FLOPS": 243912819429017.4, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04210563004016876, "optim/lr": 3.0740252668843395e-05, "optim/total_tokens": 1932190023680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3118373155593872, "created_at": "2025-06-03T03:48:07.009855+00:00"} {"global_step": 230336, "acc_step": 0, "speed/wps": 5531.5372268635565, "speed/FLOPS": 244465632453208.84, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.45, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04131351783871651, "optim/lr": 3.073670544374907e-05, "optim/total_tokens": 1932198412288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.3102115392684937, "created_at": "2025-06-03T03:48:09.975384+00:00"} {"global_step": 230337, "acc_step": 0, "speed/wps": 5530.574938896107, "speed/FLOPS": 244423104250483.88, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.48, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04316132143139839, "optim/lr": 3.073315821865452e-05, "optim/total_tokens": 1932206800896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3116306066513062, "created_at": "2025-06-03T03:48:12.941548+00:00"} {"global_step": 230338, "acc_step": 0, "speed/wps": 5532.711491704975, "speed/FLOPS": 244517528948767.22, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.35, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04099264740943909, "optim/lr": 3.0729610993559976e-05, "optim/total_tokens": 1932215189504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3038409948349, "created_at": "2025-06-03T03:48:15.910248+00:00"} {"global_step": 230339, "acc_step": 0, "speed/wps": 5518.930628041212, "speed/FLOPS": 243908485311683.44, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044466398656368256, "optim/lr": 3.0726063768465426e-05, "optim/total_tokens": 1932223578112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2962026596069336, "created_at": "2025-06-03T03:48:18.883615+00:00"} {"global_step": 230340, "acc_step": 0, "speed/wps": 5515.5229101381965, "speed/FLOPS": 243757881622651.56, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04273166507482529, "optim/lr": 3.072251654337111e-05, "optim/total_tokens": 1932231966720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3013509511947632, "created_at": "2025-06-03T03:48:21.861108+00:00"} {"global_step": 230341, "acc_step": 0, "speed/wps": 5500.298884530016, "speed/FLOPS": 243085057614397.0, "speed/curr_iter_time": 2.977, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.977, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.16 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.16, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.043141789734363556, "optim/lr": 3.071896931827656e-05, "optim/total_tokens": 1932240355328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.313486933708191, "created_at": "2025-06-03T03:48:24.843874+00:00"} {"global_step": 230342, "acc_step": 0, "speed/wps": 5511.538653574448, "speed/FLOPS": 243581797875807.7, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.15 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.15, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04200247675180435, "optim/lr": 3.071542209318201e-05, "optim/total_tokens": 1932248743936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3074491024017334, "created_at": "2025-06-03T03:48:27.820929+00:00"} {"global_step": 230343, "acc_step": 0, "speed/wps": 5517.091316204562, "speed/FLOPS": 243827197142954.94, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04296291619539261, "optim/lr": 3.0711874868087464e-05, "optim/total_tokens": 1932257132544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3188941478729248, "created_at": "2025-06-03T03:48:30.793853+00:00"} {"global_step": 230344, "acc_step": 0, "speed/wps": 5537.677554111336, "speed/FLOPS": 244737003488516.72, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.19, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.046383585780858994, "optim/lr": 3.070832764299314e-05, "optim/total_tokens": 1932265521152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.307267427444458, "created_at": "2025-06-03T03:48:33.758589+00:00"} {"global_step": 230345, "acc_step": 0, "speed/wps": 5528.781869698711, "speed/FLOPS": 244343859769719.1, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041634634137153625, "optim/lr": 3.0704780417898595e-05, "optim/total_tokens": 1932273909760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3138184547424316, "created_at": "2025-06-03T03:48:36.730029+00:00"} {"global_step": 230346, "acc_step": 0, "speed/wps": 5535.032458639158, "speed/FLOPS": 244620103807472.4, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.34, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04996292293071747, "optim/lr": 3.0701233192804045e-05, "optim/total_tokens": 1932282298368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2975914478302002, "created_at": "2025-06-03T03:48:39.698112+00:00"} {"global_step": 230347, "acc_step": 0, "speed/wps": 5524.009656718028, "speed/FLOPS": 244132952382373.28, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041271813213825226, "optim/lr": 3.069768596770972e-05, "optim/total_tokens": 1932290686976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3030869960784912, "created_at": "2025-06-03T03:48:42.669517+00:00"} {"global_step": 230348, "acc_step": 0, "speed/wps": 5522.226257494346, "speed/FLOPS": 244054135264951.25, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.13 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.13, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04465677589178085, "optim/lr": 3.0694138742615176e-05, "optim/total_tokens": 1932299075584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2907958030700684, "created_at": "2025-06-03T03:48:45.640477+00:00"} {"global_step": 230349, "acc_step": 0, "speed/wps": 5511.014322705579, "speed/FLOPS": 243558625135172.3, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04127108305692673, "optim/lr": 3.0690591517520626e-05, "optim/total_tokens": 1932307464192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3151006698608398, "created_at": "2025-06-03T03:48:48.617060+00:00"} {"global_step": 230350, "acc_step": 0, "speed/wps": 5510.348498503669, "speed/FLOPS": 243529199113445.16, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04311668500304222, "optim/lr": 3.0687044292426083e-05, "optim/total_tokens": 1932315852800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.298998475074768, "created_at": "2025-06-03T03:48:51.597601+00:00"} {"global_step": 230351, "acc_step": 0, "speed/wps": 5512.894272103298, "speed/FLOPS": 243641709276098.22, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041734229773283005, "optim/lr": 3.068349706733176e-05, "optim/total_tokens": 1932324241408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2967166900634766, "created_at": "2025-06-03T03:48:54.576423+00:00"} {"global_step": 230352, "acc_step": 0, "speed/wps": 5533.792958635225, "speed/FLOPS": 244565324251634.72, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.39, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04216335713863373, "optim/lr": 3.067994984223721e-05, "optim/total_tokens": 1932332630016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.316352367401123, "created_at": "2025-06-03T03:48:57.542627+00:00"} {"global_step": 230353, "acc_step": 0, "speed/wps": 5535.859515680338, "speed/FLOPS": 244656655495430.84, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.32, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04591357707977295, "optim/lr": 3.0676402617142664e-05, "optim/total_tokens": 1932341018624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.300294041633606, "created_at": "2025-06-03T03:49:00.512136+00:00"} {"global_step": 230354, "acc_step": 0, "speed/wps": 5536.203579420092, "speed/FLOPS": 244671861351650.12, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.31, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04089393466711044, "optim/lr": 3.0672855392048115e-05, "optim/total_tokens": 1932349407232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3063628673553467, "created_at": "2025-06-03T03:49:03.478310+00:00"} {"global_step": 230355, "acc_step": 0, "speed/wps": 5519.695216351414, "speed/FLOPS": 243942276201476.66, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05941376835107803, "optim/lr": 3.066930816695379e-05, "optim/total_tokens": 1932357795840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3058339357376099, "created_at": "2025-06-03T03:49:06.452091+00:00"} {"global_step": 230356, "acc_step": 0, "speed/wps": 5521.438183892216, "speed/FLOPS": 244019306445463.47, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04551500454545021, "optim/lr": 3.0665760941859246e-05, "optim/total_tokens": 1932366184448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2981963157653809, "created_at": "2025-06-03T03:49:09.423288+00:00"} {"global_step": 230357, "acc_step": 0, "speed/wps": 5525.839828759069, "speed/FLOPS": 244213836618917.6, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.67, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05159851536154747, "optim/lr": 3.0662213716764696e-05, "optim/total_tokens": 1932374573056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3212887048721313, "created_at": "2025-06-03T03:49:12.392180+00:00"} {"global_step": 230358, "acc_step": 0, "speed/wps": 5525.104964192181, "speed/FLOPS": 244181359366438.97, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.64, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05214550718665123, "optim/lr": 3.065866649167015e-05, "optim/total_tokens": 1932382961664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2902518510818481, "created_at": "2025-06-03T03:49:15.362436+00:00"} {"global_step": 230359, "acc_step": 0, "speed/wps": 5526.779346936767, "speed/FLOPS": 244255358513481.88, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.64, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044561538845300674, "optim/lr": 3.0655119266575827e-05, "optim/total_tokens": 1932391350272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3137102127075195, "created_at": "2025-06-03T03:49:18.335098+00:00"} {"global_step": 230360, "acc_step": 0, "speed/wps": 5535.919991913916, "speed/FLOPS": 244659328235409.62, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.32, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05493113398551941, "optim/lr": 3.065157204148128e-05, "optim/total_tokens": 1932399738880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3188616037368774, "created_at": "2025-06-03T03:49:21.302331+00:00"} {"global_step": 230361, "acc_step": 0, "speed/wps": 5502.221877165304, "speed/FLOPS": 243170044046108.16, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0022, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.14 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.14, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04120536893606186, "optim/lr": 3.0648024816386734e-05, "optim/total_tokens": 1932408127488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 355, "loss/out": 1.3138753175735474, "created_at": "2025-06-03T03:49:24.283942+00:00"} {"global_step": 230362, "acc_step": 0, "speed/wps": 5539.877284830175, "speed/FLOPS": 244834220327046.9, "speed/curr_iter_time": 2.9554, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9554, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.11, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05545790120959282, "optim/lr": 3.0644477591292184e-05, "optim/total_tokens": 1932416516096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3101524114608765, "created_at": "2025-06-03T03:49:27.247185+00:00"} {"global_step": 230363, "acc_step": 0, "speed/wps": 5536.07139690038, "speed/FLOPS": 244666019560850.34, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.29, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0405459925532341, "optim/lr": 3.064093036619786e-05, "optim/total_tokens": 1932424904704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3024232387542725, "created_at": "2025-06-03T03:49:30.213639+00:00"} {"global_step": 230364, "acc_step": 0, "speed/wps": 5529.514437885428, "speed/FLOPS": 244376235533948.12, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.049876999109983444, "optim/lr": 3.0637383141103315e-05, "optim/total_tokens": 1932433293312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2916358709335327, "created_at": "2025-06-03T03:49:33.180432+00:00"} {"global_step": 230365, "acc_step": 0, "speed/wps": 5521.63390610021, "speed/FLOPS": 244027956365259.72, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.75, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0459606796503067, "optim/lr": 3.0633835916008765e-05, "optim/total_tokens": 1932441681920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3048685789108276, "created_at": "2025-06-03T03:49:36.154916+00:00"} {"global_step": 230366, "acc_step": 0, "speed/wps": 5519.4219209359935, "speed/FLOPS": 243930197942967.78, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04967351257801056, "optim/lr": 3.063028869091422e-05, "optim/total_tokens": 1932450070528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3040722608566284, "created_at": "2025-06-03T03:49:39.129750+00:00"} {"global_step": 230367, "acc_step": 0, "speed/wps": 5516.5174794063505, "speed/FLOPS": 243801836493636.97, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04850488156080246, "optim/lr": 3.0626741465819896e-05, "optim/total_tokens": 1932458459136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.324190616607666, "created_at": "2025-06-03T03:49:42.104884+00:00"} {"global_step": 230368, "acc_step": 0, "speed/wps": 5512.966975469155, "speed/FLOPS": 243644922392739.53, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041632432490587234, "optim/lr": 3.0623194240725346e-05, "optim/total_tokens": 1932466847744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2911640405654907, "created_at": "2025-06-03T03:49:45.085103+00:00"} {"global_step": 230369, "acc_step": 0, "speed/wps": 5517.114172896298, "speed/FLOPS": 243828207291738.53, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.12 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.12, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04417752847075462, "optim/lr": 3.06196470156308e-05, "optim/total_tokens": 1932475236352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3069629669189453, "created_at": "2025-06-03T03:49:48.058948+00:00"} {"global_step": 230370, "acc_step": 0, "speed/wps": 5539.3111693917745, "speed/FLOPS": 244809200922311.1, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.22, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04081157594919205, "optim/lr": 3.061609979053625e-05, "optim/total_tokens": 1932483624960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3021353483200073, "created_at": "2025-06-03T03:49:51.020899+00:00"} {"global_step": 230371, "acc_step": 0, "speed/wps": 5535.460420218837, "speed/FLOPS": 244639017518788.25, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.29, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04504445940256119, "optim/lr": 3.0612552565441934e-05, "optim/total_tokens": 1932492013568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3037172555923462, "created_at": "2025-06-03T03:49:53.985707+00:00"} {"global_step": 230372, "acc_step": 0, "speed/wps": 5530.4278961819255, "speed/FLOPS": 244416605715149.9, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04288981482386589, "optim/lr": 3.0609005340347384e-05, "optim/total_tokens": 1932500402176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3057782649993896, "created_at": "2025-06-03T03:49:56.953342+00:00"} {"global_step": 230373, "acc_step": 0, "speed/wps": 5528.091008176411, "speed/FLOPS": 244313327226583.3, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04379662871360779, "optim/lr": 3.060545811525284e-05, "optim/total_tokens": 1932508790784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3041348457336426, "created_at": "2025-06-03T03:49:59.921667+00:00"} {"global_step": 230374, "acc_step": 0, "speed/wps": 5530.767790495054, "speed/FLOPS": 244431627304053.38, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.51, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040987469255924225, "optim/lr": 3.060191089015829e-05, "optim/total_tokens": 1932517179392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.303524374961853, "created_at": "2025-06-03T03:50:02.888059+00:00"} {"global_step": 230375, "acc_step": 0, "speed/wps": 5522.780689507127, "speed/FLOPS": 244078638322075.88, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04343869909644127, "optim/lr": 3.0598363665063965e-05, "optim/total_tokens": 1932525568000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.29482102394104, "created_at": "2025-06-03T03:50:05.861358+00:00"} {"global_step": 230376, "acc_step": 0, "speed/wps": 5525.484549915357, "speed/FLOPS": 244198135112507.5, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04163847118616104, "optim/lr": 3.059481643996942e-05, "optim/total_tokens": 1932533956608, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.309360146522522, "created_at": "2025-06-03T03:50:08.830908+00:00"} {"global_step": 230377, "acc_step": 0, "speed/wps": 5536.372205823312, "speed/FLOPS": 244679313775564.25, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.33, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05403285473585129, "optim/lr": 3.059126921487487e-05, "optim/total_tokens": 1932542345216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3049349784851074, "created_at": "2025-06-03T03:50:11.800717+00:00"} {"global_step": 230378, "acc_step": 0, "speed/wps": 5531.290219654024, "speed/FLOPS": 244454715998845.03, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.44, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04106255620718002, "optim/lr": 3.0587721989780546e-05, "optim/total_tokens": 1932550733824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2990646362304688, "created_at": "2025-06-03T03:50:14.769410+00:00"} {"global_step": 230379, "acc_step": 0, "speed/wps": 5529.551069457188, "speed/FLOPS": 244377854461922.5, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.56, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.049226466566324234, "optim/lr": 3.0584174764686e-05, "optim/total_tokens": 1932559122432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2931736707687378, "created_at": "2025-06-03T03:50:17.737885+00:00"} {"global_step": 230380, "acc_step": 0, "speed/wps": 5522.826473137706, "speed/FLOPS": 244080661724205.6, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.047936420887708664, "optim/lr": 3.0580627539591453e-05, "optim/total_tokens": 1932567511040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3053456544876099, "created_at": "2025-06-03T03:50:20.709238+00:00"} {"global_step": 230381, "acc_step": 0, "speed/wps": 5516.4474742818065, "speed/FLOPS": 243798742625450.84, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0022, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04208889603614807, "optim/lr": 3.057708031449691e-05, "optim/total_tokens": 1932575899648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3080917596817017, "created_at": "2025-06-03T03:50:23.682475+00:00"} {"global_step": 230382, "acc_step": 0, "speed/wps": 5517.028867329832, "speed/FLOPS": 243824437222334.2, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0427824892103672, "optim/lr": 3.0573533089402584e-05, "optim/total_tokens": 1932584288256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3031960725784302, "created_at": "2025-06-03T03:50:26.655777+00:00"} {"global_step": 230383, "acc_step": 0, "speed/wps": 5523.385434802311, "speed/FLOPS": 244105364968755.97, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.75, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04165525361895561, "optim/lr": 3.0569985864308034e-05, "optim/total_tokens": 1932592676864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2988524436950684, "created_at": "2025-06-03T03:50:29.626324+00:00"} {"global_step": 230384, "acc_step": 0, "speed/wps": 5518.869384512605, "speed/FLOPS": 243905778661191.84, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.039660803973674774, "optim/lr": 3.056643863921349e-05, "optim/total_tokens": 1932601065472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2956641912460327, "created_at": "2025-06-03T03:50:32.598767+00:00"} {"global_step": 230385, "acc_step": 0, "speed/wps": 5515.160988510248, "speed/FLOPS": 243741886539179.06, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.044238701462745667, "optim/lr": 3.056289141411894e-05, "optim/total_tokens": 1932609454080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3106162548065186, "created_at": "2025-06-03T03:50:35.573300+00:00"} {"global_step": 230386, "acc_step": 0, "speed/wps": 5534.4169493287845, "speed/FLOPS": 244592901446416.16, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.08 hours", "speed/est_time_elapsed_hrs": 189.39, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.08, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04110369086265564, "optim/lr": 3.0559344189024616e-05, "optim/total_tokens": 1932617842688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.322613000869751, "created_at": "2025-06-03T03:50:38.538020+00:00"} {"global_step": 230387, "acc_step": 0, "speed/wps": 5533.887010268715, "speed/FLOPS": 244569480852435.1, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.08 hours", "speed/est_time_elapsed_hrs": 189.41, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.08, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.042865775525569916, "optim/lr": 3.055579696393007e-05, "optim/total_tokens": 1932626231296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.3067392110824585, "created_at": "2025-06-03T03:50:41.504536+00:00"} {"global_step": 230388, "acc_step": 0, "speed/wps": 5522.349826297546, "speed/FLOPS": 244059596373570.25, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.0411948561668396, "optim/lr": 3.055224973883552e-05, "optim/total_tokens": 1932634619904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2914135456085205, "created_at": "2025-06-03T03:50:44.475032+00:00"} {"global_step": 230389, "acc_step": 0, "speed/wps": 5525.808777543472, "speed/FLOPS": 244212464314122.75, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04111625626683235, "optim/lr": 3.054870251374098e-05, "optim/total_tokens": 1932643008512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.296440601348877, "created_at": "2025-06-03T03:50:47.446895+00:00"} {"global_step": 230390, "acc_step": 0, "speed/wps": 5528.398937754393, "speed/FLOPS": 244326936137803.62, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.040787145495414734, "optim/lr": 3.0545155288646654e-05, "optim/total_tokens": 1932651397120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.292202353477478, "created_at": "2025-06-03T03:50:50.414258+00:00"} {"global_step": 230391, "acc_step": 0, "speed/wps": 5524.205276789411, "speed/FLOPS": 244141597788254.12, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.75, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041397593915462494, "optim/lr": 3.0541608063552104e-05, "optim/total_tokens": 1932659785728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2920231819152832, "created_at": "2025-06-03T03:50:53.384081+00:00"} {"global_step": 230392, "acc_step": 0, "speed/wps": 5523.546355871574, "speed/FLOPS": 244112476856348.7, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.041017044335603714, "optim/lr": 3.053806083845756e-05, "optim/total_tokens": 1932668174336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2951115369796753, "created_at": "2025-06-03T03:50:56.354323+00:00"} {"global_step": 230393, "acc_step": 0, "speed/wps": 5505.680516218838, "speed/FLOPS": 243322898189354.9, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04075566306710243, "optim/lr": 3.053451361336301e-05, "optim/total_tokens": 1932676562944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3034943342208862, "created_at": "2025-06-03T03:50:59.334091+00:00"} {"global_step": 230394, "acc_step": 0, "speed/wps": 5536.21716271229, "speed/FLOPS": 244672461663639.7, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 189.34, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04379504546523094, "optim/lr": 3.053096638826869e-05, "optim/total_tokens": 1932684951552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3138655424118042, "created_at": "2025-06-03T03:51:02.297677+00:00"} {"global_step": 230395, "acc_step": 0, "speed/wps": 5505.683345065792, "speed/FLOPS": 243323023209910.9, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.11 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.11, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.04212465509772301, "optim/lr": 3.052741916317414e-05, "optim/total_tokens": 1932693340160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3144445419311523, "created_at": "2025-06-03T03:51:05.280140+00:00"} {"global_step": 230396, "acc_step": 0, "speed/wps": 5519.515512410843, "speed/FLOPS": 243934334207111.56, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.046973250806331635, "optim/lr": 3.052387193807959e-05, "optim/total_tokens": 1932701728768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2991619110107422, "created_at": "2025-06-03T03:51:08.255549+00:00"} {"global_step": 230397, "acc_step": 0, "speed/wps": 5516.438027788998, "speed/FLOPS": 243798325138820.22, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.1 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.1, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.049948520958423615, "optim/lr": 3.052032471298505e-05, "optim/total_tokens": 1932710117376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3042484521865845, "created_at": "2025-06-03T03:51:11.229195+00:00"} {"global_step": 230398, "acc_step": 0, "speed/wps": 5525.940764652154, "speed/FLOPS": 244218297468755.22, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.08 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.08, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04060865938663483, "optim/lr": 3.0516777487890723e-05, "optim/total_tokens": 1932718505984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2808465957641602, "created_at": "2025-06-03T03:51:14.200138+00:00"} {"global_step": 230399, "acc_step": 0, "speed/wps": 5522.386684574789, "speed/FLOPS": 244061225320766.6, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.09 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.09, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.05234833434224129, "optim/lr": 3.0513230262796176e-05, "optim/total_tokens": 1932726894592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3126314878463745, "created_at": "2025-06-03T03:51:17.170846+00:00"} {"global_step": 230400, "acc_step": 0, "speed/wps": 5527.421931598451, "speed/FLOPS": 244283757466481.84, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.08 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.08, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04621334746479988, "optim/lr": 3.050968303770163e-05, "optim/total_tokens": 1932735283200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.46484375, "memory/max_reserved_pct": 66.7694091796875, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.3084666728973389, "created_at": "2025-06-03T03:51:20.143455+00:00"} {"global_step": 230401, "acc_step": 0, "speed/wps": 236.32265324730557, "speed/FLOPS": 10444251664537.875, "speed/curr_iter_time": 2.8793, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.8793, "speed/est_time_elapsed": "7.68 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 184.28, "speed/est_time_elapsed_days": 7.68, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045448314398527145, "optim/lr": 3.0506135812607084e-05, "optim/total_tokens": 1932743671808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3062318563461304, "created_at": "2025-06-03T03:52:29.479459+00:00"} {"global_step": 230402, "acc_step": 0, "speed/wps": 5641.359225160392, "speed/FLOPS": 249319202657984.28, "speed/curr_iter_time": 2.9032, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9032, "speed/est_time_elapsed": "7.74 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 185.81, "speed/est_time_elapsed_days": 7.74, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05225031450390816, "optim/lr": 3.0502588587512758e-05, "optim/total_tokens": 1932752060416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3079675436019897, "created_at": "2025-06-03T03:52:32.390057+00:00"} {"global_step": 230403, "acc_step": 0, "speed/wps": 5576.546184967805, "speed/FLOPS": 246454798024684.88, "speed/curr_iter_time": 2.9361, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9361, "speed/est_time_elapsed": "7.83 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 187.91, "speed/est_time_elapsed_days": 7.83, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041760239750146866, "optim/lr": 3.049904136241821e-05, "optim/total_tokens": 1932760449024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2972674369812012, "created_at": "2025-06-03T03:52:35.336692+00:00"} {"global_step": 230404, "acc_step": 0, "speed/wps": 5545.926139511798, "speed/FLOPS": 245101548743129.72, "speed/curr_iter_time": 2.9533, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9533, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.01, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04611866548657417, "optim/lr": 3.0495494137323665e-05, "optim/total_tokens": 1932768837632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3112761974334717, "created_at": "2025-06-03T03:52:38.299039+00:00"} {"global_step": 230405, "acc_step": 0, "speed/wps": 5547.432242208339, "speed/FLOPS": 245168110773384.38, "speed/curr_iter_time": 2.9525, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9525, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 188.96, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040916360914707184, "optim/lr": 3.049194691222934e-05, "optim/total_tokens": 1932777226240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3043793439865112, "created_at": "2025-06-03T03:52:41.260253+00:00"} {"global_step": 230406, "acc_step": 0, "speed/wps": 5556.289268510004, "speed/FLOPS": 245559546001547.72, "speed/curr_iter_time": 2.947, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.947, "speed/est_time_elapsed": "7.86 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 188.61, "speed/est_time_elapsed_days": 7.86, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04635215550661087, "optim/lr": 3.0488399687134792e-05, "optim/total_tokens": 1932785614848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2994848489761353, "created_at": "2025-06-03T03:52:44.217721+00:00"} {"global_step": 230407, "acc_step": 0, "speed/wps": 5549.696490772737, "speed/FLOPS": 245268178970456.03, "speed/curr_iter_time": 2.9513, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9513, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 188.89, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042266812175512314, "optim/lr": 3.0484852462040246e-05, "optim/total_tokens": 1932794003456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3048754930496216, "created_at": "2025-06-03T03:52:47.177184+00:00"} {"global_step": 230408, "acc_step": 0, "speed/wps": 5540.735242433991, "speed/FLOPS": 244872137661710.47, "speed/curr_iter_time": 2.9561, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9561, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.2, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.047249484807252884, "optim/lr": 3.04813052369457e-05, "optim/total_tokens": 1932802392064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3015294075012207, "created_at": "2025-06-03T03:52:50.141754+00:00"} {"global_step": 230409, "acc_step": 0, "speed/wps": 5543.025305854894, "speed/FLOPS": 244973346743307.22, "speed/curr_iter_time": 2.9549, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9549, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.12, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0543668195605278, "optim/lr": 3.0477758011851377e-05, "optim/total_tokens": 1932810780672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.298553705215454, "created_at": "2025-06-03T03:52:53.106178+00:00"} {"global_step": 230410, "acc_step": 0, "speed/wps": 5555.988340048317, "speed/FLOPS": 245546246503832.66, "speed/curr_iter_time": 2.9466, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9466, "speed/est_time_elapsed": "7.86 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 188.59, "speed/est_time_elapsed_days": 7.86, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04197172448039055, "optim/lr": 3.047421078675683e-05, "optim/total_tokens": 1932819169280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.3163878917694092, "created_at": "2025-06-03T03:52:56.063664+00:00"} {"global_step": 230411, "acc_step": 0, "speed/wps": 5529.691665749771, "speed/FLOPS": 244384068098417.66, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 189.58, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04116550460457802, "optim/lr": 3.047066356166228e-05, "optim/total_tokens": 1932827557888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.3037859201431274, "created_at": "2025-06-03T03:52:59.034607+00:00"} {"global_step": 230412, "acc_step": 0, "speed/wps": 5522.673871211542, "speed/FLOPS": 244073917500156.62, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.08 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.08, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04601748660206795, "optim/lr": 3.0467116336567734e-05, "optim/total_tokens": 1932835946496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3064022064208984, "created_at": "2025-06-03T03:53:02.008312+00:00"} {"global_step": 230413, "acc_step": 0, "speed/wps": 5514.584111436974, "speed/FLOPS": 243716391525264.9, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.08 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.08, "speed/est_time_remaining_days": 0.3, "optim/grad_norm": 0.045125313103199005, "optim/lr": 3.046356911147341e-05, "optim/total_tokens": 1932844335104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.297829270362854, "created_at": "2025-06-03T03:53:04.987330+00:00"} {"global_step": 230414, "acc_step": 0, "speed/wps": 5545.308933606463, "speed/FLOPS": 245074271401260.12, "speed/curr_iter_time": 2.9537, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9537, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 189.05, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041222747415304184, "optim/lr": 3.0460021886378865e-05, "optim/total_tokens": 1932852723712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3004333972930908, "created_at": "2025-06-03T03:53:07.946814+00:00"} {"global_step": 230415, "acc_step": 0, "speed/wps": 5554.414709553364, "speed/FLOPS": 245476700090526.78, "speed/curr_iter_time": 2.9489, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9489, "speed/est_time_elapsed": "7.86 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 188.74, "speed/est_time_elapsed_days": 7.86, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04456344619393349, "optim/lr": 3.045647466128432e-05, "optim/total_tokens": 1932861112320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2913843393325806, "created_at": "2025-06-03T03:53:10.904372+00:00"} {"global_step": 230416, "acc_step": 0, "speed/wps": 5522.719427250313, "speed/FLOPS": 244075930843893.34, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040674932301044464, "optim/lr": 3.045292743618977e-05, "optim/total_tokens": 1932869500928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.295923113822937, "created_at": "2025-06-03T03:53:13.877536+00:00"} {"global_step": 230417, "acc_step": 0, "speed/wps": 5518.068585988964, "speed/FLOPS": 243870387465305.28, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.08 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.08, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042227085679769516, "optim/lr": 3.0449380211095446e-05, "optim/total_tokens": 1932877889536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.287309169769287, "created_at": "2025-06-03T03:53:16.856041+00:00"} {"global_step": 230418, "acc_step": 0, "speed/wps": 5533.199511682411, "speed/FLOPS": 244539096933857.2, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.47, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04241723567247391, "optim/lr": 3.04458329860009e-05, "optim/total_tokens": 1932886278144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.3130629062652588, "created_at": "2025-06-03T03:53:19.821322+00:00"} {"global_step": 230419, "acc_step": 0, "speed/wps": 5533.394755441305, "speed/FLOPS": 244547725708652.2, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.47, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04358425736427307, "optim/lr": 3.0442285760906353e-05, "optim/total_tokens": 1932894666752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.308112382888794, "created_at": "2025-06-03T03:53:22.789478+00:00"} {"global_step": 230420, "acc_step": 0, "speed/wps": 5521.994947538546, "speed/FLOPS": 244043912548856.56, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04090392589569092, "optim/lr": 3.0438738535811807e-05, "optim/total_tokens": 1932903055360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2918074131011963, "created_at": "2025-06-03T03:53:25.763150+00:00"} {"global_step": 230421, "acc_step": 0, "speed/wps": 5519.225008790227, "speed/FLOPS": 243921495434012.62, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04753107577562332, "optim/lr": 3.043519131071748e-05, "optim/total_tokens": 1932911443968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3000564575195312, "created_at": "2025-06-03T03:53:28.739303+00:00"} {"global_step": 230422, "acc_step": 0, "speed/wps": 5534.605815164829, "speed/FLOPS": 244601248349666.34, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.43, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04298269748687744, "optim/lr": 3.0431644085622934e-05, "optim/total_tokens": 1932919832576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.313316822052002, "created_at": "2025-06-03T03:53:31.706857+00:00"} {"global_step": 230423, "acc_step": 0, "speed/wps": 5543.196643591108, "speed/FLOPS": 244980918994261.84, "speed/curr_iter_time": 2.9541, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9541, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 189.08, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.06452586501836777, "optim/lr": 3.0428096860528388e-05, "optim/total_tokens": 1932928221184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.303113341331482, "created_at": "2025-06-03T03:53:34.669207+00:00"} {"global_step": 230424, "acc_step": 0, "speed/wps": 5533.2292872338985, "speed/FLOPS": 244540412860827.88, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.47, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04285378381609917, "optim/lr": 3.042454963543384e-05, "optim/total_tokens": 1932936609792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2924871444702148, "created_at": "2025-06-03T03:53:37.636059+00:00"} {"global_step": 230425, "acc_step": 0, "speed/wps": 5532.185357272792, "speed/FLOPS": 244494276499864.9, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.51, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.062465980648994446, "optim/lr": 3.0421002410339515e-05, "optim/total_tokens": 1932944998400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3034682273864746, "created_at": "2025-06-03T03:53:40.601335+00:00"} {"global_step": 230426, "acc_step": 0, "speed/wps": 5529.7860551563235, "speed/FLOPS": 244388239627058.47, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04494696855545044, "optim/lr": 3.041745518524497e-05, "optim/total_tokens": 1932953387008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3005107641220093, "created_at": "2025-06-03T03:53:43.568671+00:00"} {"global_step": 230427, "acc_step": 0, "speed/wps": 5522.018542968797, "speed/FLOPS": 244044955346101.3, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.053217072039842606, "optim/lr": 3.0413907960150422e-05, "optim/total_tokens": 1932961775616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.306867241859436, "created_at": "2025-06-03T03:53:46.543694+00:00"} {"global_step": 230428, "acc_step": 0, "speed/wps": 5521.7416360938105, "speed/FLOPS": 244032717479564.78, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.044329844415187836, "optim/lr": 3.0410360735055876e-05, "optim/total_tokens": 1932970164224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.294957160949707, "created_at": "2025-06-03T03:53:49.517708+00:00"} {"global_step": 230429, "acc_step": 0, "speed/wps": 5521.63895322984, "speed/FLOPS": 244028179422555.8, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04718853533267975, "optim/lr": 3.040681350996155e-05, "optim/total_tokens": 1932978552832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3110860586166382, "created_at": "2025-06-03T03:53:52.492987+00:00"} {"global_step": 230430, "acc_step": 0, "speed/wps": 5519.99308905429, "speed/FLOPS": 243955440650293.06, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04181244224309921, "optim/lr": 3.0403266284867003e-05, "optim/total_tokens": 1932986941440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.310246467590332, "created_at": "2025-06-03T03:53:55.469281+00:00"} {"global_step": 230431, "acc_step": 0, "speed/wps": 5512.411483644653, "speed/FLOPS": 243620372497361.47, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.046691957861185074, "optim/lr": 3.0399719059772457e-05, "optim/total_tokens": 1932995330048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3043688535690308, "created_at": "2025-06-03T03:53:58.447941+00:00"} {"global_step": 230432, "acc_step": 0, "speed/wps": 5540.631136055965, "speed/FLOPS": 244867536692666.47, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 189.22, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0406869612634182, "optim/lr": 3.039617183467813e-05, "optim/total_tokens": 1933003718656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3156929016113281, "created_at": "2025-06-03T03:54:01.411717+00:00"} {"global_step": 230433, "acc_step": 0, "speed/wps": 5524.668354202034, "speed/FLOPS": 244162063439646.97, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04644959419965744, "optim/lr": 3.0392624609583585e-05, "optim/total_tokens": 1933012107264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3047449588775635, "created_at": "2025-06-03T03:54:04.386124+00:00"} {"global_step": 230434, "acc_step": 0, "speed/wps": 5529.664716189928, "speed/FLOPS": 244382877065812.94, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04070184379816055, "optim/lr": 3.0389077384489038e-05, "optim/total_tokens": 1933020495872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2905281782150269, "created_at": "2025-06-03T03:54:07.353854+00:00"} {"global_step": 230435, "acc_step": 0, "speed/wps": 5524.249049661675, "speed/FLOPS": 244143532325158.28, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04250270873308182, "optim/lr": 3.0385530159394492e-05, "optim/total_tokens": 1933028884480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3157894611358643, "created_at": "2025-06-03T03:54:10.324867+00:00"} {"global_step": 230436, "acc_step": 0, "speed/wps": 5513.77121816464, "speed/FLOPS": 243680465803392.7, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04338683933019638, "optim/lr": 3.038198293430017e-05, "optim/total_tokens": 1933037273088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.294988751411438, "created_at": "2025-06-03T03:54:13.300191+00:00"} {"global_step": 230437, "acc_step": 0, "speed/wps": 5517.477940352303, "speed/FLOPS": 243844283951363.3, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.043028783053159714, "optim/lr": 3.037843570920562e-05, "optim/total_tokens": 1933045661696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2983250617980957, "created_at": "2025-06-03T03:54:16.273577+00:00"} {"global_step": 230438, "acc_step": 0, "speed/wps": 5516.127179507973, "speed/FLOPS": 243784587235864.66, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040888525545597076, "optim/lr": 3.0374888484111073e-05, "optim/total_tokens": 1933054050304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2962864637374878, "created_at": "2025-06-03T03:54:19.250899+00:00"} {"global_step": 230439, "acc_step": 0, "speed/wps": 5518.4451385745515, "speed/FLOPS": 243887029162217.4, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04241548851132393, "optim/lr": 3.0371341259016526e-05, "optim/total_tokens": 1933062438912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.293182373046875, "created_at": "2025-06-03T03:54:22.225539+00:00"} {"global_step": 230440, "acc_step": 0, "speed/wps": 5530.90633287021, "speed/FLOPS": 244437750167911.1, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 189.5, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04206747189164162, "optim/lr": 3.0367794033922204e-05, "optim/total_tokens": 1933070827520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3041633367538452, "created_at": "2025-06-03T03:54:25.194777+00:00"} {"global_step": 230441, "acc_step": 0, "speed/wps": 5525.987732433986, "speed/FLOPS": 244220373204309.28, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04213333502411842, "optim/lr": 3.0364246808827657e-05, "optim/total_tokens": 1933079216128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.310392141342163, "created_at": "2025-06-03T03:54:28.166926+00:00"} {"global_step": 230442, "acc_step": 0, "speed/wps": 5515.749287301035, "speed/FLOPS": 243767886334545.7, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04319863021373749, "optim/lr": 3.0360699583733107e-05, "optim/total_tokens": 1933087604736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3125025033950806, "created_at": "2025-06-03T03:54:31.142367+00:00"} {"global_step": 230443, "acc_step": 0, "speed/wps": 5520.698501180053, "speed/FLOPS": 243986616255625.22, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04326697811484337, "optim/lr": 3.035715235863856e-05, "optim/total_tokens": 1933095993344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.293521761894226, "created_at": "2025-06-03T03:54:34.116273+00:00"} {"global_step": 230444, "acc_step": 0, "speed/wps": 5512.435603095382, "speed/FLOPS": 243621438453629.12, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042798541486263275, "optim/lr": 3.0353605133544238e-05, "optim/total_tokens": 1933104381952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.3207002878189087, "created_at": "2025-06-03T03:54:37.092637+00:00"} {"global_step": 230445, "acc_step": 0, "speed/wps": 5508.771727901533, "speed/FLOPS": 243459513923474.28, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.07 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.07, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04384022206068039, "optim/lr": 3.0350057908449692e-05, "optim/total_tokens": 1933112770560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.3071991205215454, "created_at": "2025-06-03T03:54:40.072415+00:00"} {"global_step": 230446, "acc_step": 0, "speed/wps": 5512.4743825018595, "speed/FLOPS": 243623152304904.44, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.06 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.06, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04632282257080078, "optim/lr": 3.0346510683355145e-05, "optim/total_tokens": 1933121159168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2974157333374023, "created_at": "2025-06-03T03:54:43.048993+00:00"} {"global_step": 230447, "acc_step": 0, "speed/wps": 5514.8148515008725, "speed/FLOPS": 243726589055054.5, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040707118809223175, "optim/lr": 3.0342963458260596e-05, "optim/total_tokens": 1933129547776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2940654754638672, "created_at": "2025-06-03T03:54:46.027106+00:00"} {"global_step": 230448, "acc_step": 0, "speed/wps": 5525.175800478351, "speed/FLOPS": 244184489967714.72, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04458333179354668, "optim/lr": 3.0339416233166273e-05, "optim/total_tokens": 1933137936384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.315806269645691, "created_at": "2025-06-03T03:54:48.999098+00:00"} {"global_step": 230449, "acc_step": 0, "speed/wps": 5515.274902553724, "speed/FLOPS": 243746920956835.78, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04149828478693962, "optim/lr": 3.0335869008071727e-05, "optim/total_tokens": 1933146324992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2904444932937622, "created_at": "2025-06-03T03:54:51.973890+00:00"} {"global_step": 230450, "acc_step": 0, "speed/wps": 5524.444169275198, "speed/FLOPS": 244152155613363.3, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.055209893733263016, "optim/lr": 3.033232178297718e-05, "optim/total_tokens": 1933154713600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2911673784255981, "created_at": "2025-06-03T03:54:54.946068+00:00"} {"global_step": 230451, "acc_step": 0, "speed/wps": 5515.58668110684, "speed/FLOPS": 243760699973056.2, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040978413075208664, "optim/lr": 3.0328774557882634e-05, "optim/total_tokens": 1933163102208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3018064498901367, "created_at": "2025-06-03T03:54:57.921791+00:00"} {"global_step": 230452, "acc_step": 0, "speed/wps": 5518.383296065925, "speed/FLOPS": 243884296039874.75, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.044175997376441956, "optim/lr": 3.0325227332788308e-05, "optim/total_tokens": 1933171490816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3126901388168335, "created_at": "2025-06-03T03:55:00.894850+00:00"} {"global_step": 230453, "acc_step": 0, "speed/wps": 5520.71436511264, "speed/FLOPS": 243987317360246.56, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04147261008620262, "optim/lr": 3.032168010769376e-05, "optim/total_tokens": 1933179879424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2973748445510864, "created_at": "2025-06-03T03:55:03.866833+00:00"} {"global_step": 230454, "acc_step": 0, "speed/wps": 5516.1201685339565, "speed/FLOPS": 243784277386698.56, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04305298998951912, "optim/lr": 3.0318132882599215e-05, "optim/total_tokens": 1933188268032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2932732105255127, "created_at": "2025-06-03T03:55:06.844520+00:00"} {"global_step": 230455, "acc_step": 0, "speed/wps": 5517.752664885001, "speed/FLOPS": 243856425369540.9, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04360421746969223, "optim/lr": 3.031458565750467e-05, "optim/total_tokens": 1933196656640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3061726093292236, "created_at": "2025-06-03T03:55:09.818338+00:00"} {"global_step": 230456, "acc_step": 0, "speed/wps": 5528.8326263815, "speed/FLOPS": 244346102955302.12, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04251064732670784, "optim/lr": 3.0311038432410342e-05, "optim/total_tokens": 1933205045248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3054149150848389, "created_at": "2025-06-03T03:55:12.788550+00:00"} {"global_step": 230457, "acc_step": 0, "speed/wps": 5528.280890488626, "speed/FLOPS": 244321719052877.4, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.61, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04445989057421684, "optim/lr": 3.0307491207315796e-05, "optim/total_tokens": 1933213433856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.297892451286316, "created_at": "2025-06-03T03:55:15.756722+00:00"} {"global_step": 230458, "acc_step": 0, "speed/wps": 5526.566375101011, "speed/FLOPS": 244245946248430.1, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04162757098674774, "optim/lr": 3.030394398222125e-05, "optim/total_tokens": 1933221822464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3036643266677856, "created_at": "2025-06-03T03:55:18.728327+00:00"} {"global_step": 230459, "acc_step": 0, "speed/wps": 5510.86831135857, "speed/FLOPS": 243552172180988.38, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0492452010512352, "optim/lr": 3.0300396757126923e-05, "optim/total_tokens": 1933230211072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3008177280426025, "created_at": "2025-06-03T03:55:21.708491+00:00"} {"global_step": 230460, "acc_step": 0, "speed/wps": 5508.791789323105, "speed/FLOPS": 243460400535624.1, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04417583346366882, "optim/lr": 3.0296849532032377e-05, "optim/total_tokens": 1933238599680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2998852729797363, "created_at": "2025-06-03T03:55:24.687215+00:00"} {"global_step": 230461, "acc_step": 0, "speed/wps": 5528.768653436095, "speed/FLOPS": 244343275678558.44, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04256545379757881, "optim/lr": 3.029330230693783e-05, "optim/total_tokens": 1933246988288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3015881776809692, "created_at": "2025-06-03T03:55:27.657892+00:00"} {"global_step": 230462, "acc_step": 0, "speed/wps": 5514.4913608407605, "speed/FLOPS": 243712292423652.84, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041507914662361145, "optim/lr": 3.0289755081843284e-05, "optim/total_tokens": 1933255376896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2957535982131958, "created_at": "2025-06-03T03:55:30.636074+00:00"} {"global_step": 230463, "acc_step": 0, "speed/wps": 5508.290635224961, "speed/FLOPS": 243438252089625.34, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.05 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.05, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04283701255917549, "optim/lr": 3.028620785674896e-05, "optim/total_tokens": 1933263765504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.294392704963684, "created_at": "2025-06-03T03:55:33.614923+00:00"} {"global_step": 230464, "acc_step": 0, "speed/wps": 5517.17357193961, "speed/FLOPS": 243830832425421.03, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04568028822541237, "optim/lr": 3.028266063165441e-05, "optim/total_tokens": 1933272154112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3050305843353271, "created_at": "2025-06-03T03:55:36.590782+00:00"} {"global_step": 230465, "acc_step": 0, "speed/wps": 5527.347330379228, "speed/FLOPS": 244280460474435.84, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042603183537721634, "optim/lr": 3.0279113406559865e-05, "optim/total_tokens": 1933280542720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.296386957168579, "created_at": "2025-06-03T03:55:39.561779+00:00"} {"global_step": 230466, "acc_step": 0, "speed/wps": 5522.058659389674, "speed/FLOPS": 244046728286569.62, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.046858515590429306, "optim/lr": 3.027556618146532e-05, "optim/total_tokens": 1933288931328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3205868005752563, "created_at": "2025-06-03T03:55:42.535539+00:00"} {"global_step": 230467, "acc_step": 0, "speed/wps": 5513.434988954839, "speed/FLOPS": 243665606193296.6, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040251463651657104, "optim/lr": 3.0272018956370996e-05, "optim/total_tokens": 1933297319936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3005601167678833, "created_at": "2025-06-03T03:55:45.513617+00:00"} {"global_step": 230468, "acc_step": 0, "speed/wps": 5518.576560347101, "speed/FLOPS": 243892837331886.47, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04561707377433777, "optim/lr": 3.026847173127645e-05, "optim/total_tokens": 1933305708544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3104960918426514, "created_at": "2025-06-03T03:55:48.489388+00:00"} {"global_step": 230469, "acc_step": 0, "speed/wps": 5521.609370743308, "speed/FLOPS": 244026872028068.0, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04053395614027977, "optim/lr": 3.02649245061819e-05, "optim/total_tokens": 1933314097152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2989566326141357, "created_at": "2025-06-03T03:55:51.464025+00:00"} {"global_step": 230470, "acc_step": 0, "speed/wps": 5518.058812442759, "speed/FLOPS": 243869955524588.56, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.044780198484659195, "optim/lr": 3.0261377281087353e-05, "optim/total_tokens": 1933322485760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3005763292312622, "created_at": "2025-06-03T03:55:54.437771+00:00"} {"global_step": 230471, "acc_step": 0, "speed/wps": 5516.655864513426, "speed/FLOPS": 243807952407050.56, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04180967062711716, "optim/lr": 3.025783005599303e-05, "optim/total_tokens": 1933330874368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3060787916183472, "created_at": "2025-06-03T03:55:57.414493+00:00"} {"global_step": 230472, "acc_step": 0, "speed/wps": 5516.646207119465, "speed/FLOPS": 243807525599668.47, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05123415216803551, "optim/lr": 3.0254282830898484e-05, "optim/total_tokens": 1933339262976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.285178542137146, "created_at": "2025-06-03T03:56:00.392302+00:00"} {"global_step": 230473, "acc_step": 0, "speed/wps": 5519.180785219727, "speed/FLOPS": 243919540978553.3, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04791925102472305, "optim/lr": 3.0250735605803938e-05, "optim/total_tokens": 1933347651584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3007725477218628, "created_at": "2025-06-03T03:56:03.369293+00:00"} {"global_step": 230474, "acc_step": 0, "speed/wps": 5525.833238715904, "speed/FLOPS": 244213545372740.6, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0410233698785305, "optim/lr": 3.0247188380709388e-05, "optim/total_tokens": 1933356040192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2950514554977417, "created_at": "2025-06-03T03:56:06.338585+00:00"} {"global_step": 230475, "acc_step": 0, "speed/wps": 5521.021767974359, "speed/FLOPS": 244000902993304.1, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.044571079313755035, "optim/lr": 3.0243641155615065e-05, "optim/total_tokens": 1933364428800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3191310167312622, "created_at": "2025-06-03T03:56:09.310248+00:00"} {"global_step": 230476, "acc_step": 0, "speed/wps": 5523.519347381791, "speed/FLOPS": 244111283219342.28, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04245097562670708, "optim/lr": 3.024009393052052e-05, "optim/total_tokens": 1933372817408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.305681586265564, "created_at": "2025-06-03T03:56:12.282602+00:00"} {"global_step": 230477, "acc_step": 0, "speed/wps": 5528.444160038072, "speed/FLOPS": 244328934731273.62, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.62, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04384619742631912, "optim/lr": 3.0236546705425972e-05, "optim/total_tokens": 1933381206016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3004283905029297, "created_at": "2025-06-03T03:56:15.252583+00:00"} {"global_step": 230478, "acc_step": 0, "speed/wps": 5519.189283570513, "speed/FLOPS": 243919916562159.53, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.03 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.03, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04365988448262215, "optim/lr": 3.0232999480331426e-05, "optim/total_tokens": 1933389594624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3251572847366333, "created_at": "2025-06-03T03:56:18.225229+00:00"} {"global_step": 230479, "acc_step": 0, "speed/wps": 5509.6562938230045, "speed/FLOPS": 243498607209584.5, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0455939956009388, "optim/lr": 3.02294522552371e-05, "optim/total_tokens": 1933397983232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3168452978134155, "created_at": "2025-06-03T03:56:21.205566+00:00"} {"global_step": 230480, "acc_step": 0, "speed/wps": 5517.528533823617, "speed/FLOPS": 243846519923834.53, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04602592810988426, "optim/lr": 3.0225905030142554e-05, "optim/total_tokens": 1933406371840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3094924688339233, "created_at": "2025-06-03T03:56:24.181731+00:00"} {"global_step": 230481, "acc_step": 0, "speed/wps": 5508.42945777339, "speed/FLOPS": 243444387335707.7, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.04 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.04, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042398255318403244, "optim/lr": 3.0222357805048007e-05, "optim/total_tokens": 1933414760448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3089828491210938, "created_at": "2025-06-03T03:56:27.161003+00:00"} {"global_step": 230482, "acc_step": 0, "speed/wps": 5530.971837736095, "speed/FLOPS": 244440645147698.94, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.6, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04185991734266281, "optim/lr": 3.021881057995346e-05, "optim/total_tokens": 1933423149056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3056998252868652, "created_at": "2025-06-03T03:56:30.127496+00:00"} {"global_step": 230483, "acc_step": 0, "speed/wps": 5526.267861577948, "speed/FLOPS": 244232753478641.44, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041877929121255875, "optim/lr": 3.0215263354859135e-05, "optim/total_tokens": 1933431537664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3054479360580444, "created_at": "2025-06-03T03:56:33.096828+00:00"} {"global_step": 230484, "acc_step": 0, "speed/wps": 5514.908954997513, "speed/FLOPS": 243730747947940.66, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04227248579263687, "optim/lr": 3.0211716129764588e-05, "optim/total_tokens": 1933439926272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3045523166656494, "created_at": "2025-06-03T03:56:36.075694+00:00"} {"global_step": 230485, "acc_step": 0, "speed/wps": 5525.384996031201, "speed/FLOPS": 244193735340390.75, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04161796346306801, "optim/lr": 3.0208168904670042e-05, "optim/total_tokens": 1933448314880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3037891387939453, "created_at": "2025-06-03T03:56:39.047164+00:00"} {"global_step": 230486, "acc_step": 0, "speed/wps": 5528.075991223545, "speed/FLOPS": 244312663554130.38, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041217587888240814, "optim/lr": 3.0204621679575716e-05, "optim/total_tokens": 1933456703488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3075661659240723, "created_at": "2025-06-03T03:56:42.019283+00:00"} {"global_step": 230487, "acc_step": 0, "speed/wps": 5512.063354942325, "speed/FLOPS": 243604986990602.75, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040657442063093185, "optim/lr": 3.020107445448117e-05, "optim/total_tokens": 1933465092096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2986066341400146, "created_at": "2025-06-03T03:56:44.999231+00:00"} {"global_step": 230488, "acc_step": 0, "speed/wps": 5517.515948855905, "speed/FLOPS": 243845963732677.34, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04073438048362732, "optim/lr": 3.0197527229386623e-05, "optim/total_tokens": 1933473480704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2973065376281738, "created_at": "2025-06-03T03:56:47.973174+00:00"} {"global_step": 230489, "acc_step": 0, "speed/wps": 5520.286608786152, "speed/FLOPS": 243968412720071.16, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041295915842056274, "optim/lr": 3.0193980004292076e-05, "optim/total_tokens": 1933481869312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.292886734008789, "created_at": "2025-06-03T03:56:50.947258+00:00"} {"global_step": 230490, "acc_step": 0, "speed/wps": 5512.819016488576, "speed/FLOPS": 243638383363120.66, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04162460193037987, "optim/lr": 3.019043277919775e-05, "optim/total_tokens": 1933490257920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3031727075576782, "created_at": "2025-06-03T03:56:53.923286+00:00"} {"global_step": 230491, "acc_step": 0, "speed/wps": 5516.11647106742, "speed/FLOPS": 243784113977603.0, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04072288051247597, "optim/lr": 3.0186885554103204e-05, "optim/total_tokens": 1933498646528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2912755012512207, "created_at": "2025-06-03T03:56:56.901162+00:00"} {"global_step": 230492, "acc_step": 0, "speed/wps": 5533.407080520709, "speed/FLOPS": 244548270414076.38, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "7.0 hours", "speed/est_time_elapsed_hrs": 189.52, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 7.0, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04117834195494652, "optim/lr": 3.0183338329008657e-05, "optim/total_tokens": 1933507035136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3060613870620728, "created_at": "2025-06-03T03:56:59.869185+00:00"} {"global_step": 230493, "acc_step": 0, "speed/wps": 5517.214521641473, "speed/FLOPS": 243832642192643.8, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040585245937108994, "optim/lr": 3.017979110391411e-05, "optim/total_tokens": 1933515423744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3158131837844849, "created_at": "2025-06-03T03:57:02.842659+00:00"} {"global_step": 230494, "acc_step": 0, "speed/wps": 5521.304245705438, "speed/FLOPS": 244013387063165.66, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041898760944604874, "optim/lr": 3.0176243878819788e-05, "optim/total_tokens": 1933523812352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3157676458358765, "created_at": "2025-06-03T03:57:05.815746+00:00"} {"global_step": 230495, "acc_step": 0, "speed/wps": 5522.246558740796, "speed/FLOPS": 244055032476133.16, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041560184210538864, "optim/lr": 3.017269665372524e-05, "optim/total_tokens": 1933532200960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3138598203659058, "created_at": "2025-06-03T03:57:08.788873+00:00"} {"global_step": 230496, "acc_step": 0, "speed/wps": 5516.244060526823, "speed/FLOPS": 243789752778646.56, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04019748046994209, "optim/lr": 3.0169149428630692e-05, "optim/total_tokens": 1933540589568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.306632399559021, "created_at": "2025-06-03T03:57:11.765664+00:00"} {"global_step": 230497, "acc_step": 0, "speed/wps": 5507.912387643736, "speed/FLOPS": 243421535482581.8, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040797047317028046, "optim/lr": 3.0165602203536146e-05, "optim/total_tokens": 1933548978176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3103225231170654, "created_at": "2025-06-03T03:57:14.747724+00:00"} {"global_step": 230498, "acc_step": 0, "speed/wps": 5519.031001753975, "speed/FLOPS": 243912921316028.34, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042012009769678116, "optim/lr": 3.0162054978441823e-05, "optim/total_tokens": 1933557366784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3185138702392578, "created_at": "2025-06-03T03:57:17.720397+00:00"} {"global_step": 230499, "acc_step": 0, "speed/wps": 5530.835747766853, "speed/FLOPS": 244434630667630.06, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.62, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040089577436447144, "optim/lr": 3.0158507753347277e-05, "optim/total_tokens": 1933565755392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.293879508972168, "created_at": "2025-06-03T03:57:20.687502+00:00"} {"global_step": 230500, "acc_step": 0, "speed/wps": 5531.172815808367, "speed/FLOPS": 244449527349794.3, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.61, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04127275571227074, "optim/lr": 3.0154960528252727e-05, "optim/total_tokens": 1933574144000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.3060479164123535, "created_at": "2025-06-03T03:57:23.653497+00:00"} {"global_step": 230501, "acc_step": 0, "speed/wps": 5529.962938431803, "speed/FLOPS": 244396056962464.0, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.58, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04064495116472244, "optim/lr": 3.015141330315818e-05, "optim/total_tokens": 1933582532608, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3136532306671143, "created_at": "2025-06-03T03:57:26.620301+00:00"} {"global_step": 230502, "acc_step": 0, "speed/wps": 5522.686324551159, "speed/FLOPS": 244074467874025.7, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "7.0 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 7.0, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042888205498456955, "optim/lr": 3.0147866078063858e-05, "optim/total_tokens": 1933590921216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3022701740264893, "created_at": "2025-06-03T03:57:29.592952+00:00"} {"global_step": 230503, "acc_step": 0, "speed/wps": 5520.739677774426, "speed/FLOPS": 243988436050335.56, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.0 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.0, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0417114794254303, "optim/lr": 3.014431885296931e-05, "optim/total_tokens": 1933599309824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2968887090682983, "created_at": "2025-06-03T03:57:32.565021+00:00"} {"global_step": 230504, "acc_step": 0, "speed/wps": 5506.037725614267, "speed/FLOPS": 243338685016269.4, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04091625660657883, "optim/lr": 3.0140771627874765e-05, "optim/total_tokens": 1933607698432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2966018915176392, "created_at": "2025-06-03T03:57:35.550009+00:00"} {"global_step": 230505, "acc_step": 0, "speed/wps": 5510.258907261426, "speed/FLOPS": 243525239639107.56, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042349644005298615, "optim/lr": 3.0137224402780215e-05, "optim/total_tokens": 1933616087040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3036028146743774, "created_at": "2025-06-03T03:57:38.527547+00:00"} {"global_step": 230506, "acc_step": 0, "speed/wps": 5529.272115400286, "speed/FLOPS": 244365526120423.75, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.67, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041682034730911255, "optim/lr": 3.0133677177685892e-05, "optim/total_tokens": 1933624475648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.297770380973816, "created_at": "2025-06-03T03:57:41.494425+00:00"} {"global_step": 230507, "acc_step": 0, "speed/wps": 5536.202170831366, "speed/FLOPS": 244671799099238.25, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 189.38, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.049169156700372696, "optim/lr": 3.0130129952591346e-05, "optim/total_tokens": 1933632864256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.291143536567688, "created_at": "2025-06-03T03:57:44.457599+00:00"} {"global_step": 230508, "acc_step": 0, "speed/wps": 5527.483603894302, "speed/FLOPS": 244286483066291.03, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04156240075826645, "optim/lr": 3.01265827274968e-05, "optim/total_tokens": 1933641252864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3112258911132812, "created_at": "2025-06-03T03:57:47.426108+00:00"} {"global_step": 230509, "acc_step": 0, "speed/wps": 5524.411267519082, "speed/FLOPS": 244150701524149.44, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.043633442372083664, "optim/lr": 3.0123035502402253e-05, "optim/total_tokens": 1933649641472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3186966180801392, "created_at": "2025-06-03T03:57:50.397663+00:00"} {"global_step": 230510, "acc_step": 0, "speed/wps": 5529.626164697235, "speed/FLOPS": 244381173287160.34, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04744106903672218, "optim/lr": 3.0119488277307927e-05, "optim/total_tokens": 1933658030080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.302312970161438, "created_at": "2025-06-03T03:57:53.364168+00:00"} {"global_step": 230511, "acc_step": 0, "speed/wps": 5513.0056768333825, "speed/FLOPS": 243646632794946.84, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "7.0 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 7.0, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.044240552932024, "optim/lr": 3.011594105221338e-05, "optim/total_tokens": 1933666418688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2960134744644165, "created_at": "2025-06-03T03:57:56.340043+00:00"} {"global_step": 230512, "acc_step": 0, "speed/wps": 5501.649193158095, "speed/FLOPS": 243144734344252.0, "speed/curr_iter_time": 2.9772, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9772, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.02 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.02, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04404287040233612, "optim/lr": 3.0112393827118834e-05, "optim/total_tokens": 1933674807296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3042988777160645, "created_at": "2025-06-03T03:57:59.324761+00:00"} {"global_step": 230513, "acc_step": 0, "speed/wps": 5505.925427078215, "speed/FLOPS": 243333721995771.9, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04599403589963913, "optim/lr": 3.0108846602024508e-05, "optim/total_tokens": 1933683195904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3045282363891602, "created_at": "2025-06-03T03:58:02.305117+00:00"} {"global_step": 230514, "acc_step": 0, "speed/wps": 5510.461969161477, "speed/FLOPS": 243534213935724.78, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.0 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.0, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04210653156042099, "optim/lr": 3.010529937692996e-05, "optim/total_tokens": 1933691584512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2977550029754639, "created_at": "2025-06-03T03:58:05.283907+00:00"} {"global_step": 230515, "acc_step": 0, "speed/wps": 5510.983293729814, "speed/FLOPS": 243557253813264.22, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.01 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.01, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0423300676047802, "optim/lr": 3.0101752151835415e-05, "optim/total_tokens": 1933699973120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.283065915107727, "created_at": "2025-06-03T03:58:08.261575+00:00"} {"global_step": 230516, "acc_step": 0, "speed/wps": 5527.7129422745875, "speed/FLOPS": 244296618648839.4, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0406341589987278, "optim/lr": 3.009820492674087e-05, "optim/total_tokens": 1933708361728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3147072792053223, "created_at": "2025-06-03T03:58:11.229724+00:00"} {"global_step": 230517, "acc_step": 0, "speed/wps": 5522.402944359226, "speed/FLOPS": 244061943920013.6, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04444282874464989, "optim/lr": 3.0094657701646543e-05, "optim/total_tokens": 1933716750336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3025529384613037, "created_at": "2025-06-03T03:58:14.200601+00:00"} {"global_step": 230518, "acc_step": 0, "speed/wps": 5528.878568618302, "speed/FLOPS": 244348133367015.1, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041757188737392426, "optim/lr": 3.0091110476551996e-05, "optim/total_tokens": 1933725138944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.301086187362671, "created_at": "2025-06-03T03:58:17.172383+00:00"} {"global_step": 230519, "acc_step": 0, "speed/wps": 5522.152837358082, "speed/FLOPS": 244050890470726.72, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045455705374479294, "optim/lr": 3.008756325145745e-05, "optim/total_tokens": 1933733527552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3076050281524658, "created_at": "2025-06-03T03:58:20.146860+00:00"} {"global_step": 230520, "acc_step": 0, "speed/wps": 5516.917815948514, "speed/FLOPS": 243819529319692.4, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04661814495921135, "optim/lr": 3.0084016026362903e-05, "optim/total_tokens": 1933741916160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.320107340812683, "created_at": "2025-06-03T03:58:23.124509+00:00"} {"global_step": 230521, "acc_step": 0, "speed/wps": 5514.384116667555, "speed/FLOPS": 243707552780122.6, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04101324826478958, "optim/lr": 3.008046880126858e-05, "optim/total_tokens": 1933750304768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3120990991592407, "created_at": "2025-06-03T03:58:26.099580+00:00"} {"global_step": 230522, "acc_step": 0, "speed/wps": 5510.34822450274, "speed/FLOPS": 243529187004006.53, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "7.0 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 7.0, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041495367884635925, "optim/lr": 3.007692157617403e-05, "optim/total_tokens": 1933758693376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.294384241104126, "created_at": "2025-06-03T03:58:29.079543+00:00"} {"global_step": 230523, "acc_step": 0, "speed/wps": 5514.432057133537, "speed/FLOPS": 243709671503337.44, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040473200380802155, "optim/lr": 3.0073374351079484e-05, "optim/total_tokens": 1933767081984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2940545082092285, "created_at": "2025-06-03T03:58:32.058906+00:00"} {"global_step": 230524, "acc_step": 0, "speed/wps": 5531.984871408079, "speed/FLOPS": 244485416050824.25, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 189.54, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0429510772228241, "optim/lr": 3.0069827125984938e-05, "optim/total_tokens": 1933775470592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.3028160333633423, "created_at": "2025-06-03T03:58:35.028036+00:00"} {"global_step": 230525, "acc_step": 0, "speed/wps": 5536.513045969058, "speed/FLOPS": 244685538189121.03, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.44, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04094440117478371, "optim/lr": 3.0066279900890615e-05, "optim/total_tokens": 1933783859200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2901866436004639, "created_at": "2025-06-03T03:58:37.994856+00:00"} {"global_step": 230526, "acc_step": 0, "speed/wps": 5524.061988855489, "speed/FLOPS": 244135265194988.9, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0470721535384655, "optim/lr": 3.006273267579607e-05, "optim/total_tokens": 1933792247808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3226875066757202, "created_at": "2025-06-03T03:58:40.967119+00:00"} {"global_step": 230527, "acc_step": 0, "speed/wps": 5519.030919943735, "speed/FLOPS": 243912917700434.47, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05207205191254616, "optim/lr": 3.005918545070152e-05, "optim/total_tokens": 1933800636416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3040471076965332, "created_at": "2025-06-03T03:58:43.942713+00:00"} {"global_step": 230528, "acc_step": 0, "speed/wps": 5530.434163378292, "speed/FLOPS": 244416882693150.9, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 189.65, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041233837604522705, "optim/lr": 3.0055638225606973e-05, "optim/total_tokens": 1933809025024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.296233057975769, "created_at": "2025-06-03T03:58:46.912189+00:00"} {"global_step": 230529, "acc_step": 0, "speed/wps": 5523.898053984744, "speed/FLOPS": 244128020112796.72, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05544173717498779, "optim/lr": 3.005209100051265e-05, "optim/total_tokens": 1933817413632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3107017278671265, "created_at": "2025-06-03T03:58:49.887308+00:00"} {"global_step": 230530, "acc_step": 0, "speed/wps": 5514.224356422779, "speed/FLOPS": 243700492195030.56, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04231397062540054, "optim/lr": 3.0048543775418104e-05, "optim/total_tokens": 1933825802240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3015702962875366, "created_at": "2025-06-03T03:58:52.865727+00:00"} {"global_step": 230531, "acc_step": 0, "speed/wps": 5524.039320436167, "speed/FLOPS": 244134263366882.34, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04898644611239433, "optim/lr": 3.0044996550323557e-05, "optim/total_tokens": 1933834190848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3062360286712646, "created_at": "2025-06-03T03:58:55.835872+00:00"} {"global_step": 230532, "acc_step": 0, "speed/wps": 5531.726034920114, "speed/FLOPS": 244473976802901.44, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.61, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04738624766469002, "optim/lr": 3.0041449325229007e-05, "optim/total_tokens": 1933842579456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3023326396942139, "created_at": "2025-06-03T03:58:58.801546+00:00"} {"global_step": 230533, "acc_step": 0, "speed/wps": 5525.032948483589, "speed/FLOPS": 244178176640729.03, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04251004010438919, "optim/lr": 3.0037902100134685e-05, "optim/total_tokens": 1933850968064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2982650995254517, "created_at": "2025-06-03T03:59:01.772018+00:00"} {"global_step": 230534, "acc_step": 0, "speed/wps": 5525.670007925046, "speed/FLOPS": 244206331407275.6, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04490135237574577, "optim/lr": 3.0034354875040138e-05, "optim/total_tokens": 1933859356672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2980470657348633, "created_at": "2025-06-03T03:59:04.744934+00:00"} {"global_step": 230535, "acc_step": 0, "speed/wps": 5520.420995642235, "speed/FLOPS": 243974351931255.72, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04080864042043686, "optim/lr": 3.0030807649945592e-05, "optim/total_tokens": 1933867745280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3157483339309692, "created_at": "2025-06-03T03:59:07.716957+00:00"} {"global_step": 230536, "acc_step": 0, "speed/wps": 5519.456546073907, "speed/FLOPS": 243931728196836.03, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045293133705854416, "optim/lr": 3.0027260424851045e-05, "optim/total_tokens": 1933876133888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3108861446380615, "created_at": "2025-06-03T03:59:10.690205+00:00"} {"global_step": 230537, "acc_step": 0, "speed/wps": 5510.682965217939, "speed/FLOPS": 243543980830260.03, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040684737265110016, "optim/lr": 3.002371319975672e-05, "optim/total_tokens": 1933884522496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.288503646850586, "created_at": "2025-06-03T03:59:13.667937+00:00"} {"global_step": 230538, "acc_step": 0, "speed/wps": 5518.825566139425, "speed/FLOPS": 243903842113380.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0450788289308548, "optim/lr": 3.0020165974662173e-05, "optim/total_tokens": 1933892911104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2957440614700317, "created_at": "2025-06-03T03:59:16.640839+00:00"} {"global_step": 230539, "acc_step": 0, "speed/wps": 5523.198138122723, "speed/FLOPS": 244097087414189.53, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04086530581116676, "optim/lr": 3.0016618749567626e-05, "optim/total_tokens": 1933901299712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.30320143699646, "created_at": "2025-06-03T03:59:19.613797+00:00"} {"global_step": 230540, "acc_step": 0, "speed/wps": 5523.4192928843295, "speed/FLOPS": 244106861322679.84, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04382491856813431, "optim/lr": 3.00130715244733e-05, "optim/total_tokens": 1933909688320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2970671653747559, "created_at": "2025-06-03T03:59:22.584129+00:00"} {"global_step": 230541, "acc_step": 0, "speed/wps": 5534.119433813651, "speed/FLOPS": 244579752783469.7, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.48, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04253751039505005, "optim/lr": 3.0009524299378754e-05, "optim/total_tokens": 1933918076928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2882219552993774, "created_at": "2025-06-03T03:59:25.549731+00:00"} {"global_step": 230542, "acc_step": 0, "speed/wps": 5525.946736581662, "speed/FLOPS": 244218561397472.34, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04406644403934479, "optim/lr": 3.0005977074284208e-05, "optim/total_tokens": 1933926465536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3092970848083496, "created_at": "2025-06-03T03:59:28.518454+00:00"} {"global_step": 230543, "acc_step": 0, "speed/wps": 5519.602728860942, "speed/FLOPS": 243938188727791.66, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.043429985642433167, "optim/lr": 3.000242984918966e-05, "optim/total_tokens": 1933934854144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3211809396743774, "created_at": "2025-06-03T03:59:31.493679+00:00"} {"global_step": 230544, "acc_step": 0, "speed/wps": 5522.489587247874, "speed/FLOPS": 244065773092213.3, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.044119395315647125, "optim/lr": 2.9998882624095335e-05, "optim/total_tokens": 1933943242752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.305079460144043, "created_at": "2025-06-03T03:59:34.464533+00:00"} {"global_step": 230545, "acc_step": 0, "speed/wps": 5516.296340333118, "speed/FLOPS": 243792063278492.47, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04463769868016243, "optim/lr": 2.999533539900079e-05, "optim/total_tokens": 1933951631360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2939765453338623, "created_at": "2025-06-03T03:59:37.441789+00:00"} {"global_step": 230546, "acc_step": 0, "speed/wps": 5526.69688483026, "speed/FLOPS": 244251714110453.6, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.8, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04038561135530472, "optim/lr": 2.9991788173906242e-05, "optim/total_tokens": 1933960019968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.293718695640564, "created_at": "2025-06-03T03:59:40.410583+00:00"} {"global_step": 230547, "acc_step": 0, "speed/wps": 5506.865105307559, "speed/FLOPS": 243375250963799.75, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04279249906539917, "optim/lr": 2.9988240948811696e-05, "optim/total_tokens": 1933968408576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3102872371673584, "created_at": "2025-06-03T03:59:43.390102+00:00"} {"global_step": 230548, "acc_step": 0, "speed/wps": 5526.3788361583975, "speed/FLOPS": 244237657987077.94, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.75, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04014754295349121, "optim/lr": 2.998469372371737e-05, "optim/total_tokens": 1933976797184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3122230768203735, "created_at": "2025-06-03T03:59:46.358420+00:00"} {"global_step": 230549, "acc_step": 0, "speed/wps": 5504.007325733751, "speed/FLOPS": 243248951734079.28, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.99 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.99, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04141447693109512, "optim/lr": 2.9981146498622823e-05, "optim/total_tokens": 1933985185792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2935454845428467, "created_at": "2025-06-03T03:59:49.341598+00:00"} {"global_step": 230550, "acc_step": 0, "speed/wps": 5531.552286977331, "speed/FLOPS": 244466298033153.03, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04152316600084305, "optim/lr": 2.9977599273528277e-05, "optim/total_tokens": 1933993574400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3073011636734009, "created_at": "2025-06-03T03:59:52.307747+00:00"} {"global_step": 230551, "acc_step": 0, "speed/wps": 5520.984324515906, "speed/FLOPS": 243999248184093.47, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04092401638627052, "optim/lr": 2.997405204843373e-05, "optim/total_tokens": 1934001963008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3023048639297485, "created_at": "2025-06-03T03:59:55.279740+00:00"} {"global_step": 230552, "acc_step": 0, "speed/wps": 5503.204000546126, "speed/FLOPS": 243213448872577.3, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.98 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.98, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042572490870952606, "optim/lr": 2.9970504823339408e-05, "optim/total_tokens": 1934010351616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.293747901916504, "created_at": "2025-06-03T03:59:58.260899+00:00"} {"global_step": 230553, "acc_step": 0, "speed/wps": 5524.072290181482, "speed/FLOPS": 244135720460870.78, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042254384607076645, "optim/lr": 2.9966957598244858e-05, "optim/total_tokens": 1934018740224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.3065768480300903, "created_at": "2025-06-03T04:00:01.234104+00:00"} {"global_step": 230554, "acc_step": 0, "speed/wps": 5518.566827414366, "speed/FLOPS": 243892407186077.28, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041645947843790054, "optim/lr": 2.996341037315031e-05, "optim/total_tokens": 1934027128832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.296584963798523, "created_at": "2025-06-03T04:00:04.210508+00:00"} {"global_step": 230555, "acc_step": 0, "speed/wps": 5511.300671733567, "speed/FLOPS": 243571280296542.2, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0416484996676445, "optim/lr": 2.9959863148055765e-05, "optim/total_tokens": 1934035517440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3107706308364868, "created_at": "2025-06-03T04:00:07.190222+00:00"} {"global_step": 230556, "acc_step": 0, "speed/wps": 5515.772862244477, "speed/FLOPS": 243768928226378.3, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045870404690504074, "optim/lr": 2.9956315922961442e-05, "optim/total_tokens": 1934043906048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3041400909423828, "created_at": "2025-06-03T04:00:10.165017+00:00"} {"global_step": 230557, "acc_step": 0, "speed/wps": 5515.1970437146, "speed/FLOPS": 243743479994664.16, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04554968699812889, "optim/lr": 2.9952768697866896e-05, "optim/total_tokens": 1934052294656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3043580055236816, "created_at": "2025-06-03T04:00:13.142548+00:00"} {"global_step": 230558, "acc_step": 0, "speed/wps": 5523.735639494237, "speed/FLOPS": 244120842223629.0, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04398437216877937, "optim/lr": 2.9949221472772346e-05, "optim/total_tokens": 1934060683264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3057308197021484, "created_at": "2025-06-03T04:00:16.112830+00:00"} {"global_step": 230559, "acc_step": 0, "speed/wps": 5528.902053059034, "speed/FLOPS": 244349171259091.2, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04280177876353264, "optim/lr": 2.99456742476778e-05, "optim/total_tokens": 1934069071872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3019803762435913, "created_at": "2025-06-03T04:00:19.080019+00:00"} {"global_step": 230560, "acc_step": 0, "speed/wps": 5522.905134018759, "speed/FLOPS": 244084138132525.25, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04450376704335213, "optim/lr": 2.9942127022583477e-05, "optim/total_tokens": 1934077460480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2897248268127441, "created_at": "2025-06-03T04:00:22.051738+00:00"} {"global_step": 230561, "acc_step": 0, "speed/wps": 5516.445991832434, "speed/FLOPS": 243798677108776.44, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042423006147146225, "optim/lr": 2.993857979748893e-05, "optim/total_tokens": 1934085849088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3013434410095215, "created_at": "2025-06-03T04:00:25.025961+00:00"} {"global_step": 230562, "acc_step": 0, "speed/wps": 5512.81807066157, "speed/FLOPS": 243638341562408.2, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042313914746046066, "optim/lr": 2.9935032572394384e-05, "optim/total_tokens": 1934094237696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3172521591186523, "created_at": "2025-06-03T04:00:28.002144+00:00"} {"global_step": 230563, "acc_step": 0, "speed/wps": 5520.040336840181, "speed/FLOPS": 243957528760593.34, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04810759425163269, "optim/lr": 2.9931485347299838e-05, "optim/total_tokens": 1934102626304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3100380897521973, "created_at": "2025-06-03T04:00:30.975450+00:00"} {"global_step": 230564, "acc_step": 0, "speed/wps": 5510.332326886022, "speed/FLOPS": 243528484410718.97, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.97 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.97, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041590865701436996, "optim/lr": 2.992793812220551e-05, "optim/total_tokens": 1934111014912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2974313497543335, "created_at": "2025-06-03T04:00:33.957195+00:00"} {"global_step": 230565, "acc_step": 0, "speed/wps": 5523.857740856573, "speed/FLOPS": 244126238478872.84, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.047309812158346176, "optim/lr": 2.9924390897110965e-05, "optim/total_tokens": 1934119403520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2871077060699463, "created_at": "2025-06-03T04:00:36.929587+00:00"} {"global_step": 230566, "acc_step": 0, "speed/wps": 5542.788775384956, "speed/FLOPS": 244962893307208.66, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 189.26, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045940548181533813, "optim/lr": 2.992084367201642e-05, "optim/total_tokens": 1934127792128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.3011131286621094, "created_at": "2025-06-03T04:00:39.889723+00:00"} {"global_step": 230567, "acc_step": 0, "speed/wps": 5522.479950591197, "speed/FLOPS": 244065347201313.1, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041235677897930145, "optim/lr": 2.9917296446922093e-05, "optim/total_tokens": 1934136180736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2979075908660889, "created_at": "2025-06-03T04:00:42.865416+00:00"} {"global_step": 230568, "acc_step": 0, "speed/wps": 5521.3319040270435, "speed/FLOPS": 244014609419412.5, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04553881660103798, "optim/lr": 2.9913749221827546e-05, "optim/total_tokens": 1934144569344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.318261742591858, "created_at": "2025-06-03T04:00:45.837265+00:00"} {"global_step": 230569, "acc_step": 0, "speed/wps": 5532.717493068087, "speed/FLOPS": 244517794178299.0, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 189.61, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04241937771439552, "optim/lr": 2.9910201996733e-05, "optim/total_tokens": 1934152957952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.299354910850525, "created_at": "2025-06-03T04:00:48.802231+00:00"} {"global_step": 230570, "acc_step": 0, "speed/wps": 5516.554914197003, "speed/FLOPS": 243803490919775.2, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.051770713180303574, "optim/lr": 2.9906654771638453e-05, "optim/total_tokens": 1934161346560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.303992748260498, "created_at": "2025-06-03T04:00:51.779211+00:00"} {"global_step": 230571, "acc_step": 0, "speed/wps": 5516.6564773460605, "speed/FLOPS": 243807979491116.22, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042769622057676315, "optim/lr": 2.9903107546544127e-05, "optim/total_tokens": 1934169735168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.305943489074707, "created_at": "2025-06-03T04:00:54.753239+00:00"} {"global_step": 230572, "acc_step": 0, "speed/wps": 5518.501865327973, "speed/FLOPS": 243889536194364.78, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04371015354990959, "optim/lr": 2.989956032144958e-05, "optim/total_tokens": 1934178123776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3176426887512207, "created_at": "2025-06-03T04:00:57.725897+00:00"} {"global_step": 230573, "acc_step": 0, "speed/wps": 5507.964765299589, "speed/FLOPS": 243423850306877.38, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042475149035453796, "optim/lr": 2.9896013096355035e-05, "optim/total_tokens": 1934186512384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3134996891021729, "created_at": "2025-06-03T04:01:00.704393+00:00"} {"global_step": 230574, "acc_step": 0, "speed/wps": 5537.944779294225, "speed/FLOPS": 244748813473817.94, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 189.44, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04109736904501915, "optim/lr": 2.9892465871260488e-05, "optim/total_tokens": 1934194900992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3076993227005005, "created_at": "2025-06-03T04:01:03.667410+00:00"} {"global_step": 230575, "acc_step": 0, "speed/wps": 5512.24293363374, "speed/FLOPS": 243612923449596.25, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04285239055752754, "optim/lr": 2.9888918646166162e-05, "optim/total_tokens": 1934203289600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3145464658737183, "created_at": "2025-06-03T04:01:06.643572+00:00"} {"global_step": 230576, "acc_step": 0, "speed/wps": 5505.211306008529, "speed/FLOPS": 243302161499694.8, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.96 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.96, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04410931095480919, "optim/lr": 2.9885371421071616e-05, "optim/total_tokens": 1934211678208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3038839101791382, "created_at": "2025-06-03T04:01:09.623851+00:00"} {"global_step": 230577, "acc_step": 0, "speed/wps": 5518.0276461086, "speed/FLOPS": 243868578132142.5, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04278916120529175, "optim/lr": 2.988182419597707e-05, "optim/total_tokens": 1934220066816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3072470426559448, "created_at": "2025-06-03T04:01:12.596815+00:00"} {"global_step": 230578, "acc_step": 0, "speed/wps": 5526.275751606259, "speed/FLOPS": 244233102177508.0, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04029249772429466, "optim/lr": 2.9878276970882523e-05, "optim/total_tokens": 1934228455424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2993139028549194, "created_at": "2025-06-03T04:01:15.566898+00:00"} {"global_step": 230579, "acc_step": 0, "speed/wps": 5515.592132646095, "speed/FLOPS": 243760940903187.75, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04128590226173401, "optim/lr": 2.98747297457882e-05, "optim/total_tokens": 1934236844032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3025768995285034, "created_at": "2025-06-03T04:01:18.541297+00:00"} {"global_step": 230580, "acc_step": 0, "speed/wps": 5513.449794281795, "speed/FLOPS": 243666260512967.5, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0437561459839344, "optim/lr": 2.987118252069365e-05, "optim/total_tokens": 1934245232640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3073992729187012, "created_at": "2025-06-03T04:01:21.517807+00:00"} {"global_step": 230581, "acc_step": 0, "speed/wps": 5512.87153199086, "speed/FLOPS": 243640704279522.88, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.95 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.95, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04081733152270317, "optim/lr": 2.9867635295599104e-05, "optim/total_tokens": 1934253621248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2941536903381348, "created_at": "2025-06-03T04:01:24.497004+00:00"} {"global_step": 230582, "acc_step": 0, "speed/wps": 5520.305842575441, "speed/FLOPS": 243969262755110.28, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.94 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.94, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042248260229825974, "optim/lr": 2.9864088070504557e-05, "optim/total_tokens": 1934262009856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3160127401351929, "created_at": "2025-06-03T04:01:27.468780+00:00"} {"global_step": 230583, "acc_step": 0, "speed/wps": 5522.084892655685, "speed/FLOPS": 244047887662653.25, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.94 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.94, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04112531617283821, "optim/lr": 2.9860540845410235e-05, "optim/total_tokens": 1934270398464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3056715726852417, "created_at": "2025-06-03T04:01:30.439805+00:00"} {"global_step": 230584, "acc_step": 0, "speed/wps": 5520.24563382196, "speed/FLOPS": 243966601836382.75, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.94 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.94, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04044245555996895, "optim/lr": 2.9856993620315688e-05, "optim/total_tokens": 1934278787072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.302865743637085, "created_at": "2025-06-03T04:01:33.411563+00:00"} {"global_step": 230585, "acc_step": 0, "speed/wps": 5522.448420084323, "speed/FLOPS": 244063953714297.0, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040965814143419266, "optim/lr": 2.985344639522114e-05, "optim/total_tokens": 1934287175680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3129562139511108, "created_at": "2025-06-03T04:01:36.383820+00:00"} {"global_step": 230586, "acc_step": 0, "speed/wps": 5522.526065992748, "speed/FLOPS": 244067385266021.62, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04132963344454765, "optim/lr": 2.9849899170126592e-05, "optim/total_tokens": 1934295564288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3043406009674072, "created_at": "2025-06-03T04:01:39.355635+00:00"} {"global_step": 230587, "acc_step": 0, "speed/wps": 5527.008315622185, "speed/FLOPS": 244265477757409.38, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04205477982759476, "optim/lr": 2.984635194503227e-05, "optim/total_tokens": 1934303952896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3046953678131104, "created_at": "2025-06-03T04:01:42.323552+00:00"} {"global_step": 230588, "acc_step": 0, "speed/wps": 5522.25730572968, "speed/FLOPS": 244055507438033.75, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041987184435129166, "optim/lr": 2.9842804719937723e-05, "optim/total_tokens": 1934312341504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.317798137664795, "created_at": "2025-06-03T04:01:45.294590+00:00"} {"global_step": 230589, "acc_step": 0, "speed/wps": 5520.529531505605, "speed/FLOPS": 243979148660879.78, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040568944066762924, "optim/lr": 2.9839257494843176e-05, "optim/total_tokens": 1934320730112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.300690770149231, "created_at": "2025-06-03T04:01:48.266356+00:00"} {"global_step": 230590, "acc_step": 0, "speed/wps": 5512.483967861345, "speed/FLOPS": 243623575928731.38, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.94 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.94, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041795194149017334, "optim/lr": 2.9835710269748627e-05, "optim/total_tokens": 1934329118720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2942187786102295, "created_at": "2025-06-03T04:01:51.242512+00:00"} {"global_step": 230591, "acc_step": 0, "speed/wps": 5524.738672234503, "speed/FLOPS": 244165171136761.78, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04075003042817116, "optim/lr": 2.9832163044654304e-05, "optim/total_tokens": 1934337507328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2999650239944458, "created_at": "2025-06-03T04:01:54.213287+00:00"} {"global_step": 230592, "acc_step": 0, "speed/wps": 5523.3260120452205, "speed/FLOPS": 244102738787045.84, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041388463228940964, "optim/lr": 2.9828615819559758e-05, "optim/total_tokens": 1934345895936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.296457290649414, "created_at": "2025-06-03T04:01:57.182967+00:00"} {"global_step": 230593, "acc_step": 0, "speed/wps": 5532.553850964119, "speed/FLOPS": 244510562034899.84, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04155854508280754, "optim/lr": 2.982506859446521e-05, "optim/total_tokens": 1934354284544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2933738231658936, "created_at": "2025-06-03T04:02:00.151032+00:00"} {"global_step": 230594, "acc_step": 0, "speed/wps": 5534.810774764864, "speed/FLOPS": 244610306514909.53, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04092126712203026, "optim/lr": 2.9821521369370885e-05, "optim/total_tokens": 1934362673152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3069053888320923, "created_at": "2025-06-03T04:02:03.118434+00:00"} {"global_step": 230595, "acc_step": 0, "speed/wps": 5520.890033931089, "speed/FLOPS": 243995081022867.53, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.043586526066064835, "optim/lr": 2.981797414427634e-05, "optim/total_tokens": 1934371061760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2978708744049072, "created_at": "2025-06-03T04:02:06.094456+00:00"} {"global_step": 230596, "acc_step": 0, "speed/wps": 5517.559579008368, "speed/FLOPS": 243847891962096.84, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05571764335036278, "optim/lr": 2.9814426919181792e-05, "optim/total_tokens": 1934379450368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3077824115753174, "created_at": "2025-06-03T04:02:09.067617+00:00"} {"global_step": 230597, "acc_step": 0, "speed/wps": 5514.888325592446, "speed/FLOPS": 243729836233827.53, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04215781018137932, "optim/lr": 2.9810879694087246e-05, "optim/total_tokens": 1934387838976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2807496786117554, "created_at": "2025-06-03T04:02:12.046172+00:00"} {"global_step": 230598, "acc_step": 0, "speed/wps": 5510.711306973916, "speed/FLOPS": 243545233390807.97, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.94 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.94, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.051576171070337296, "optim/lr": 2.980733246899292e-05, "optim/total_tokens": 1934396227584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3097580671310425, "created_at": "2025-06-03T04:02:15.027454+00:00"} {"global_step": 230599, "acc_step": 0, "speed/wps": 5512.954728320645, "speed/FLOPS": 243644381131461.97, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04419291764497757, "optim/lr": 2.9803785243898373e-05, "optim/total_tokens": 1934404616192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3013226985931396, "created_at": "2025-06-03T04:02:18.006900+00:00"} {"global_step": 230600, "acc_step": 0, "speed/wps": 5524.435155103993, "speed/FLOPS": 244151757233134.75, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04396321251988411, "optim/lr": 2.9800238018803827e-05, "optim/total_tokens": 1934413004800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3100366592407227, "created_at": "2025-06-03T04:02:20.977672+00:00"} {"global_step": 230601, "acc_step": 0, "speed/wps": 5540.678418895522, "speed/FLOPS": 244869626352159.38, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 189.36, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04449543356895447, "optim/lr": 2.979669079370928e-05, "optim/total_tokens": 1934421393408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.298744797706604, "created_at": "2025-06-03T04:02:23.941209+00:00"} {"global_step": 230602, "acc_step": 0, "speed/wps": 5519.374306236377, "speed/FLOPS": 243928093616958.88, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04223393276333809, "optim/lr": 2.9793143568614954e-05, "optim/total_tokens": 1934429782016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.287398099899292, "created_at": "2025-06-03T04:02:26.913437+00:00"} {"global_step": 230603, "acc_step": 0, "speed/wps": 5520.478605808998, "speed/FLOPS": 243976898005751.1, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.044489745050668716, "optim/lr": 2.9789596343520408e-05, "optim/total_tokens": 1934438170624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3228042125701904, "created_at": "2025-06-03T04:02:29.885978+00:00"} {"global_step": 230604, "acc_step": 0, "speed/wps": 5521.412710594092, "speed/FLOPS": 244018180656070.53, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041452135890722275, "optim/lr": 2.978604911842586e-05, "optim/total_tokens": 1934446559232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2815642356872559, "created_at": "2025-06-03T04:02:32.860662+00:00"} {"global_step": 230605, "acc_step": 0, "speed/wps": 5516.200248374339, "speed/FLOPS": 243787816505757.7, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04250958561897278, "optim/lr": 2.9782501893331315e-05, "optim/total_tokens": 1934454947840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3167963027954102, "created_at": "2025-06-03T04:02:35.838396+00:00"} {"global_step": 230606, "acc_step": 0, "speed/wps": 5514.26585564542, "speed/FLOPS": 243702326248259.0, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.93 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.93, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042165953665971756, "optim/lr": 2.977895466823699e-05, "optim/total_tokens": 1934463336448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.306549072265625, "created_at": "2025-06-03T04:02:38.813831+00:00"} {"global_step": 230607, "acc_step": 0, "speed/wps": 5525.773917752911, "speed/FLOPS": 244210923689808.5, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041126422584056854, "optim/lr": 2.9775407443142443e-05, "optim/total_tokens": 1934471725056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.311396837234497, "created_at": "2025-06-03T04:02:41.786120+00:00"} {"global_step": 230608, "acc_step": 0, "speed/wps": 5526.745738475146, "speed/FLOPS": 244253873191501.9, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 189.8, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04155868664383888, "optim/lr": 2.9771860218047896e-05, "optim/total_tokens": 1934480113664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2925411462783813, "created_at": "2025-06-03T04:02:44.754354+00:00"} {"global_step": 230609, "acc_step": 0, "speed/wps": 5519.336065628927, "speed/FLOPS": 243926403577842.75, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04266371205449104, "optim/lr": 2.976831299295335e-05, "optim/total_tokens": 1934488502272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.299349308013916, "created_at": "2025-06-03T04:02:47.727755+00:00"} {"global_step": 230610, "acc_step": 0, "speed/wps": 5526.978045686803, "speed/FLOPS": 244264139981201.06, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04144233465194702, "optim/lr": 2.9764765767859027e-05, "optim/total_tokens": 1934496890880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.307732105255127, "created_at": "2025-06-03T04:02:50.701032+00:00"} {"global_step": 230611, "acc_step": 0, "speed/wps": 5518.031502343003, "speed/FLOPS": 243868748557965.12, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04147680848836899, "optim/lr": 2.9761218542764477e-05, "optim/total_tokens": 1934505279488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2878824472427368, "created_at": "2025-06-03T04:02:53.675148+00:00"} {"global_step": 230612, "acc_step": 0, "speed/wps": 5522.0994580369625, "speed/FLOPS": 244048531377953.34, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0422041080892086, "optim/lr": 2.975767131766993e-05, "optim/total_tokens": 1934513668096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2945830821990967, "created_at": "2025-06-03T04:02:56.646017+00:00"} {"global_step": 230613, "acc_step": 0, "speed/wps": 5519.42446434063, "speed/FLOPS": 243930310348434.4, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041356898844242096, "optim/lr": 2.9754124092575384e-05, "optim/total_tokens": 1934522056704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.291450023651123, "created_at": "2025-06-03T04:02:59.618334+00:00"} {"global_step": 230614, "acc_step": 0, "speed/wps": 5514.7573577548055, "speed/FLOPS": 243724048125758.0, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04197029024362564, "optim/lr": 2.975057686748106e-05, "optim/total_tokens": 1934530445312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.298032283782959, "created_at": "2025-06-03T04:03:02.596718+00:00"} {"global_step": 230615, "acc_step": 0, "speed/wps": 5515.999997139185, "speed/FLOPS": 243778966426142.62, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04101467505097389, "optim/lr": 2.9747029642386515e-05, "optim/total_tokens": 1934538833920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2848464250564575, "created_at": "2025-06-03T04:03:05.572537+00:00"} {"global_step": 230616, "acc_step": 0, "speed/wps": 5516.348877565982, "speed/FLOPS": 243794385155275.12, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041523512452840805, "optim/lr": 2.9743482417291965e-05, "optim/total_tokens": 1934547222528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3014253377914429, "created_at": "2025-06-03T04:03:08.547358+00:00"} {"global_step": 230617, "acc_step": 0, "speed/wps": 5544.016544909365, "speed/FLOPS": 245017154435893.4, "speed/curr_iter_time": 2.9544, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9544, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 189.26, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045351795852184296, "optim/lr": 2.973993519219742e-05, "optim/total_tokens": 1934555611136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2895458936691284, "created_at": "2025-06-03T04:03:11.506764+00:00"} {"global_step": 230618, "acc_step": 0, "speed/wps": 5524.414987390315, "speed/FLOPS": 244150865923417.9, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04100312665104866, "optim/lr": 2.9736387967103096e-05, "optim/total_tokens": 1934563999744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2845200300216675, "created_at": "2025-06-03T04:03:14.477204+00:00"} {"global_step": 230619, "acc_step": 0, "speed/wps": 5521.825275415505, "speed/FLOPS": 244036413909478.8, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04095832258462906, "optim/lr": 2.973284074200855e-05, "optim/total_tokens": 1934572388352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2908979654312134, "created_at": "2025-06-03T04:03:17.450549+00:00"} {"global_step": 230620, "acc_step": 0, "speed/wps": 5523.41784050213, "speed/FLOPS": 244106797134820.6, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04047480598092079, "optim/lr": 2.9729293516914003e-05, "optim/total_tokens": 1934580776960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.284760594367981, "created_at": "2025-06-03T04:03:20.421030+00:00"} {"global_step": 230621, "acc_step": 0, "speed/wps": 5509.475262139478, "speed/FLOPS": 243490606535776.78, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.92 hours", "speed/est_time_elapsed_hrs": 190.45, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.92, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04463164880871773, "optim/lr": 2.9725746291819677e-05, "optim/total_tokens": 1934589165568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.301741123199463, "created_at": "2025-06-03T04:03:23.401220+00:00"} {"global_step": 230622, "acc_step": 0, "speed/wps": 5517.295444791237, "speed/FLOPS": 243836218581661.16, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045019861310720444, "optim/lr": 2.972219906672513e-05, "optim/total_tokens": 1934597554176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.301551342010498, "created_at": "2025-06-03T04:03:26.374684+00:00"} {"global_step": 230623, "acc_step": 0, "speed/wps": 5526.932830889515, "speed/FLOPS": 244262141718591.22, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0423913337290287, "optim/lr": 2.9718651841630585e-05, "optim/total_tokens": 1934605942784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2892791032791138, "created_at": "2025-06-03T04:03:29.345842+00:00"} {"global_step": 230624, "acc_step": 0, "speed/wps": 5535.1447468514225, "speed/FLOPS": 244625066371711.3, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 189.57, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04453440010547638, "optim/lr": 2.9715104616536038e-05, "optim/total_tokens": 1934614331392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2878645658493042, "created_at": "2025-06-03T04:03:32.316465+00:00"} {"global_step": 230625, "acc_step": 0, "speed/wps": 5538.540941233791, "speed/FLOPS": 244775160780113.34, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 189.38, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042436860501766205, "optim/lr": 2.9711557391441712e-05, "optim/total_tokens": 1934622720000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3081557750701904, "created_at": "2025-06-03T04:03:35.281688+00:00"} {"global_step": 230626, "acc_step": 0, "speed/wps": 5531.751779151211, "speed/FLOPS": 244475114566145.0, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042221929877996445, "optim/lr": 2.9708010166347166e-05, "optim/total_tokens": 1934631108608, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.296749234199524, "created_at": "2025-06-03T04:03:38.248385+00:00"} {"global_step": 230627, "acc_step": 0, "speed/wps": 5520.311707058683, "speed/FLOPS": 243969521935252.44, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04351557791233063, "optim/lr": 2.970446294125262e-05, "optim/total_tokens": 1934639497216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3000195026397705, "created_at": "2025-06-03T04:03:41.223217+00:00"} {"global_step": 230628, "acc_step": 0, "speed/wps": 5524.521670502411, "speed/FLOPS": 244155580770918.9, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04183201119303703, "optim/lr": 2.9700915716158073e-05, "optim/total_tokens": 1934647885824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3075059652328491, "created_at": "2025-06-03T04:03:44.196721+00:00"} {"global_step": 230629, "acc_step": 0, "speed/wps": 5522.336618232321, "speed/FLOPS": 244059012644692.28, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04550234600901604, "optim/lr": 2.9697368491063747e-05, "optim/total_tokens": 1934656274432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.300806999206543, "created_at": "2025-06-03T04:03:47.171242+00:00"} {"global_step": 230630, "acc_step": 0, "speed/wps": 5529.70295274844, "speed/FLOPS": 244384566925986.72, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.049065425992012024, "optim/lr": 2.96938212659692e-05, "optim/total_tokens": 1934664663040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3040565252304077, "created_at": "2025-06-03T04:03:50.143036+00:00"} {"global_step": 230631, "acc_step": 0, "speed/wps": 5515.238500520371, "speed/FLOPS": 243745312173284.1, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0416007861495018, "optim/lr": 2.9690274040874654e-05, "optim/total_tokens": 1934673051648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3021516799926758, "created_at": "2025-06-03T04:03:53.117962+00:00"} {"global_step": 230632, "acc_step": 0, "speed/wps": 5521.72810727633, "speed/FLOPS": 244032119575078.9, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042858969420194626, "optim/lr": 2.9686726815780107e-05, "optim/total_tokens": 1934681440256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3110114336013794, "created_at": "2025-06-03T04:03:56.091141+00:00"} {"global_step": 230633, "acc_step": 0, "speed/wps": 5531.8096164871085, "speed/FLOPS": 244477670680353.34, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 189.7, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.039820779114961624, "optim/lr": 2.968317959068578e-05, "optim/total_tokens": 1934689828864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3053181171417236, "created_at": "2025-06-03T04:03:59.059168+00:00"} {"global_step": 230634, "acc_step": 0, "speed/wps": 5518.860238332248, "speed/FLOPS": 243905374446834.4, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.045136433094739914, "optim/lr": 2.9679632365591235e-05, "optim/total_tokens": 1934698217472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3044044971466064, "created_at": "2025-06-03T04:04:02.036155+00:00"} {"global_step": 230635, "acc_step": 0, "speed/wps": 5515.014920306357, "speed/FLOPS": 243735431072211.94, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04059542343020439, "optim/lr": 2.967608514049669e-05, "optim/total_tokens": 1934706606080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3081449270248413, "created_at": "2025-06-03T04:04:05.010784+00:00"} {"global_step": 230636, "acc_step": 0, "speed/wps": 5514.719058357021, "speed/FLOPS": 243722355488410.0, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042919691652059555, "optim/lr": 2.9672537915402142e-05, "optim/total_tokens": 1934714994688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.305307149887085, "created_at": "2025-06-03T04:04:07.988793+00:00"} {"global_step": 230637, "acc_step": 0, "speed/wps": 5514.606039813453, "speed/FLOPS": 243717360647265.66, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04088915139436722, "optim/lr": 2.966899069030782e-05, "optim/total_tokens": 1934723383296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3100587129592896, "created_at": "2025-06-03T04:04:10.966914+00:00"} {"global_step": 230638, "acc_step": 0, "speed/wps": 5512.830834170888, "speed/FLOPS": 243638905644190.47, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0411292165517807, "optim/lr": 2.966544346521327e-05, "optim/total_tokens": 1934731771904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.301184058189392, "created_at": "2025-06-03T04:04:13.943490+00:00"} {"global_step": 230639, "acc_step": 0, "speed/wps": 5518.8953381709525, "speed/FLOPS": 243906925680047.9, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04498303681612015, "optim/lr": 2.9661896240118723e-05, "optim/total_tokens": 1934740160512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2947899103164673, "created_at": "2025-06-03T04:04:16.916230+00:00"} {"global_step": 230640, "acc_step": 0, "speed/wps": 5517.0991138703375, "speed/FLOPS": 243827541759870.16, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041281409561634064, "optim/lr": 2.9658349015024177e-05, "optim/total_tokens": 1934748549120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.296860694885254, "created_at": "2025-06-03T04:04:19.893832+00:00"} {"global_step": 230641, "acc_step": 0, "speed/wps": 5502.530433874366, "speed/FLOPS": 243183680673312.3, "speed/curr_iter_time": 2.9767, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9767, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.91 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.91, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04424619302153587, "optim/lr": 2.9654801789929854e-05, "optim/total_tokens": 1934756937728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.304719090461731, "created_at": "2025-06-03T04:04:22.875534+00:00"} {"global_step": 230642, "acc_step": 0, "speed/wps": 5540.754607638666, "speed/FLOPS": 244872993504637.0, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 189.33, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04189375787973404, "optim/lr": 2.9651254564835308e-05, "optim/total_tokens": 1934765326336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.300191044807434, "created_at": "2025-06-03T04:04:25.839929+00:00"} {"global_step": 230643, "acc_step": 0, "speed/wps": 5532.063849058857, "speed/FLOPS": 244488906458744.38, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.043310925364494324, "optim/lr": 2.9647707339740758e-05, "optim/total_tokens": 1934773714944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.3095767498016357, "created_at": "2025-06-03T04:04:28.805352+00:00"} {"global_step": 230644, "acc_step": 0, "speed/wps": 5526.365729902123, "speed/FLOPS": 244237078757634.5, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04475456103682518, "optim/lr": 2.964416011464621e-05, "optim/total_tokens": 1934782103552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3078359365463257, "created_at": "2025-06-03T04:04:31.779131+00:00"} {"global_step": 230645, "acc_step": 0, "speed/wps": 5520.642562563694, "speed/FLOPS": 243984144055101.9, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0421726293861866, "optim/lr": 2.964061288955189e-05, "optim/total_tokens": 1934790492160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2964290380477905, "created_at": "2025-06-03T04:04:34.750797+00:00"} {"global_step": 230646, "acc_step": 0, "speed/wps": 5528.455666063003, "speed/FLOPS": 244329443238682.4, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04887206852436066, "optim/lr": 2.9637065664457342e-05, "optim/total_tokens": 1934798880768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2887804508209229, "created_at": "2025-06-03T04:04:37.718349+00:00"} {"global_step": 230647, "acc_step": 0, "speed/wps": 5521.413288958996, "speed/FLOPS": 244018206216838.97, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04907060042023659, "optim/lr": 2.9633518439362796e-05, "optim/total_tokens": 1934807269376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2943156957626343, "created_at": "2025-06-03T04:04:40.691482+00:00"} {"global_step": 230648, "acc_step": 0, "speed/wps": 5529.275291350992, "speed/FLOPS": 244365666481188.97, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04573525860905647, "optim/lr": 2.962997121426847e-05, "optim/total_tokens": 1934815657984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3228167295455933, "created_at": "2025-06-03T04:04:43.658914+00:00"} {"global_step": 230649, "acc_step": 0, "speed/wps": 5530.3021649412285, "speed/FLOPS": 244411049037861.94, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05705352500081062, "optim/lr": 2.9626423989173923e-05, "optim/total_tokens": 1934824046592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2997537851333618, "created_at": "2025-06-03T04:04:46.628394+00:00"} {"global_step": 230650, "acc_step": 0, "speed/wps": 5521.961894255651, "speed/FLOPS": 244042451762934.66, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042803455144166946, "optim/lr": 2.9622876764079377e-05, "optim/total_tokens": 1934832435200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3136014938354492, "created_at": "2025-06-03T04:04:49.604493+00:00"} {"global_step": 230651, "acc_step": 0, "speed/wps": 5521.714499668281, "speed/FLOPS": 244031518188453.2, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.050865862518548965, "optim/lr": 2.961932953898483e-05, "optim/total_tokens": 1934840823808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.308880090713501, "created_at": "2025-06-03T04:04:52.576406+00:00"} {"global_step": 230652, "acc_step": 0, "speed/wps": 5530.055347548565, "speed/FLOPS": 244400140972432.12, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04403533414006233, "optim/lr": 2.9615782313890504e-05, "optim/total_tokens": 1934849212416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3038979768753052, "created_at": "2025-06-03T04:04:55.546341+00:00"} {"global_step": 230653, "acc_step": 0, "speed/wps": 5522.772001513261, "speed/FLOPS": 244078254357216.2, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04730797931551933, "optim/lr": 2.9612235088795958e-05, "optim/total_tokens": 1934857601024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2884670495986938, "created_at": "2025-06-03T04:04:58.519762+00:00"} {"global_step": 230654, "acc_step": 0, "speed/wps": 5520.762213004131, "speed/FLOPS": 243989431992142.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04550595209002495, "optim/lr": 2.960868786370141e-05, "optim/total_tokens": 1934865989632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3117637634277344, "created_at": "2025-06-03T04:05:01.496569+00:00"} {"global_step": 230655, "acc_step": 0, "speed/wps": 5513.552176678284, "speed/FLOPS": 243670785290851.72, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04730251803994179, "optim/lr": 2.9605140638606865e-05, "optim/total_tokens": 1934874378240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.296332597732544, "created_at": "2025-06-03T04:05:04.475744+00:00"} {"global_step": 230656, "acc_step": 0, "speed/wps": 5504.73590465488, "speed/FLOPS": 243281151193188.22, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.9 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.9, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05016295611858368, "optim/lr": 2.960159341351254e-05, "optim/total_tokens": 1934882766848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.295032262802124, "created_at": "2025-06-03T04:05:07.456348+00:00"} {"global_step": 230657, "acc_step": 0, "speed/wps": 5513.217032019188, "speed/FLOPS": 243655973612345.53, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04266577214002609, "optim/lr": 2.9598046188417993e-05, "optim/total_tokens": 1934891155456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3141884803771973, "created_at": "2025-06-03T04:05:10.432051+00:00"} {"global_step": 230658, "acc_step": 0, "speed/wps": 5526.564965769513, "speed/FLOPS": 244245883963191.53, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04652755707502365, "optim/lr": 2.9594498963323446e-05, "optim/total_tokens": 1934899544064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3009494543075562, "created_at": "2025-06-03T04:05:13.400578+00:00"} {"global_step": 230659, "acc_step": 0, "speed/wps": 5527.833186858287, "speed/FLOPS": 244301932843971.34, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04522353783249855, "optim/lr": 2.95909517382289e-05, "optim/total_tokens": 1934907932672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3034828901290894, "created_at": "2025-06-03T04:05:16.368390+00:00"} {"global_step": 230660, "acc_step": 0, "speed/wps": 5529.84402174001, "speed/FLOPS": 244390801453357.56, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05540180206298828, "optim/lr": 2.9587404513134574e-05, "optim/total_tokens": 1934916321280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3033031225204468, "created_at": "2025-06-03T04:05:19.335524+00:00"} {"global_step": 230661, "acc_step": 0, "speed/wps": 5526.679393934361, "speed/FLOPS": 244250941102381.34, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04038034379482269, "optim/lr": 2.9583857288040027e-05, "optim/total_tokens": 1934924709888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2996718883514404, "created_at": "2025-06-03T04:05:22.306645+00:00"} {"global_step": 230662, "acc_step": 0, "speed/wps": 5523.497657189892, "speed/FLOPS": 244110324623880.84, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04810786992311478, "optim/lr": 2.958031006294548e-05, "optim/total_tokens": 1934933098496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2919214963912964, "created_at": "2025-06-03T04:05:25.278857+00:00"} {"global_step": 230663, "acc_step": 0, "speed/wps": 5517.137474017993, "speed/FLOPS": 243829237082051.47, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041682105511426926, "optim/lr": 2.9576762837850934e-05, "optim/total_tokens": 1934941487104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2891290187835693, "created_at": "2025-06-03T04:05:28.252501+00:00"} {"global_step": 230664, "acc_step": 0, "speed/wps": 5501.119128901595, "speed/FLOPS": 243121308217229.5, "speed/curr_iter_time": 2.9775, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9775, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05315135046839714, "optim/lr": 2.9573215612756608e-05, "optim/total_tokens": 1934949875712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3138290643692017, "created_at": "2025-06-03T04:05:31.239246+00:00"} {"global_step": 230665, "acc_step": 0, "speed/wps": 5512.391052555782, "speed/FLOPS": 243619469547809.16, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04207761213183403, "optim/lr": 2.9569668387662062e-05, "optim/total_tokens": 1934958264320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.270080327987671, "created_at": "2025-06-03T04:05:34.215698+00:00"} {"global_step": 230666, "acc_step": 0, "speed/wps": 5535.165679597232, "speed/FLOPS": 244625991491932.6, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 189.54, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.052868906408548355, "optim/lr": 2.9566121162567515e-05, "optim/total_tokens": 1934966652928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3004114627838135, "created_at": "2025-06-03T04:05:37.179495+00:00"} {"global_step": 230667, "acc_step": 0, "speed/wps": 5524.78638343829, "speed/FLOPS": 244167279727761.1, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0434323288500309, "optim/lr": 2.956257393747297e-05, "optim/total_tokens": 1934975041536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3125485181808472, "created_at": "2025-06-03T04:05:40.152012+00:00"} {"global_step": 230668, "acc_step": 0, "speed/wps": 5531.450185926069, "speed/FLOPS": 244461785689287.78, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042911455035209656, "optim/lr": 2.9559026712378646e-05, "optim/total_tokens": 1934983430144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3006376028060913, "created_at": "2025-06-03T04:05:43.117765+00:00"} {"global_step": 230669, "acc_step": 0, "speed/wps": 5520.5535089656605, "speed/FLOPS": 243980208341886.47, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04315459355711937, "optim/lr": 2.9555479487284097e-05, "optim/total_tokens": 1934991818752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3134653568267822, "created_at": "2025-06-03T04:05:46.092254+00:00"} {"global_step": 230670, "acc_step": 0, "speed/wps": 5527.741840290042, "speed/FLOPS": 244297895793209.03, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04528737813234329, "optim/lr": 2.955193226218955e-05, "optim/total_tokens": 1935000207360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2960351705551147, "created_at": "2025-06-03T04:05:49.063532+00:00"} {"global_step": 230671, "acc_step": 0, "speed/wps": 5527.985623278625, "speed/FLOPS": 244308669753509.97, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04657013341784477, "optim/lr": 2.9548385037095004e-05, "optim/total_tokens": 1935008595968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3054015636444092, "created_at": "2025-06-03T04:05:52.035845+00:00"} {"global_step": 230672, "acc_step": 0, "speed/wps": 5499.646771099434, "speed/FLOPS": 243056237538584.38, "speed/curr_iter_time": 2.9773, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9773, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04575498774647713, "optim/lr": 2.954483781200068e-05, "optim/total_tokens": 1935016984576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.291795015335083, "created_at": "2025-06-03T04:05:55.024139+00:00"} {"global_step": 230673, "acc_step": 0, "speed/wps": 5506.8759239521905, "speed/FLOPS": 243375729092517.6, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.88 hours", "speed/est_time_elapsed_hrs": 190.59, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.88, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.05034628510475159, "optim/lr": 2.9541290586906135e-05, "optim/total_tokens": 1935025373184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3136223554611206, "created_at": "2025-06-03T04:05:58.003876+00:00"} {"global_step": 230674, "acc_step": 0, "speed/wps": 5501.434554968327, "speed/FLOPS": 243135248434882.06, "speed/curr_iter_time": 2.9773, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9773, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.89 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.89, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04225647822022438, "optim/lr": 2.9537743361811588e-05, "optim/total_tokens": 1935033761792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3028349876403809, "created_at": "2025-06-03T04:06:00.985807+00:00"} {"global_step": 230675, "acc_step": 0, "speed/wps": 5531.302813187849, "speed/FLOPS": 244455272568580.53, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.048798151314258575, "optim/lr": 2.953419613671704e-05, "optim/total_tokens": 1935042150400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3152368068695068, "created_at": "2025-06-03T04:06:03.956214+00:00"} {"global_step": 230676, "acc_step": 0, "speed/wps": 5515.184094615167, "speed/FLOPS": 243742907710748.72, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 190.23, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04151526093482971, "optim/lr": 2.9530648911622716e-05, "optim/total_tokens": 1935050539008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2952382564544678, "created_at": "2025-06-03T04:06:06.936312+00:00"} {"global_step": 230677, "acc_step": 0, "speed/wps": 5514.135433287064, "speed/FLOPS": 243696562247581.84, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.87 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.87, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.0419464111328125, "optim/lr": 2.952710168652817e-05, "optim/total_tokens": 1935058927616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2987313270568848, "created_at": "2025-06-03T04:06:09.911227+00:00"} {"global_step": 230678, "acc_step": 0, "speed/wps": 5533.966715067107, "speed/FLOPS": 244573003396557.84, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04069213196635246, "optim/lr": 2.9523554461433623e-05, "optim/total_tokens": 1935067316224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.3073338270187378, "created_at": "2025-06-03T04:06:12.879529+00:00"} {"global_step": 230679, "acc_step": 0, "speed/wps": 5525.970689954866, "speed/FLOPS": 244219620013963.5, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04344475269317627, "optim/lr": 2.9520007236339297e-05, "optim/total_tokens": 1935075704832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2983945608139038, "created_at": "2025-06-03T04:06:15.849183+00:00"} {"global_step": 230680, "acc_step": 0, "speed/wps": 5526.888960780186, "speed/FLOPS": 244260202884306.47, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04341345280408859, "optim/lr": 2.951646001124475e-05, "optim/total_tokens": 1935084093440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3066684007644653, "created_at": "2025-06-03T04:06:18.817300+00:00"} {"global_step": 230681, "acc_step": 0, "speed/wps": 5514.690964921367, "speed/FLOPS": 243721113902349.34, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04184071719646454, "optim/lr": 2.9512912786150204e-05, "optim/total_tokens": 1935092482048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3097797632217407, "created_at": "2025-06-03T04:06:21.794464+00:00"} {"global_step": 230682, "acc_step": 0, "speed/wps": 5512.264116247785, "speed/FLOPS": 243613859612714.6, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041739799082279205, "optim/lr": 2.9509365561055657e-05, "optim/total_tokens": 1935100870656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3043421506881714, "created_at": "2025-06-03T04:06:24.776656+00:00"} {"global_step": 230683, "acc_step": 0, "speed/wps": 5530.090489542054, "speed/FLOPS": 244401694068671.3, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.040429431945085526, "optim/lr": 2.950581833596133e-05, "optim/total_tokens": 1935109259264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3049107789993286, "created_at": "2025-06-03T04:06:27.744999+00:00"} {"global_step": 230684, "acc_step": 0, "speed/wps": 5527.565405183044, "speed/FLOPS": 244290098264556.47, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04107101261615753, "optim/lr": 2.9502271110866785e-05, "optim/total_tokens": 1935117647872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3046952486038208, "created_at": "2025-06-03T04:06:30.717161+00:00"} {"global_step": 230685, "acc_step": 0, "speed/wps": 5539.383939786772, "speed/FLOPS": 244812417001297.38, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 189.48, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04124412685632706, "optim/lr": 2.949872388577224e-05, "optim/total_tokens": 1935126036480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3140454292297363, "created_at": "2025-06-03T04:06:33.682872+00:00"} {"global_step": 230686, "acc_step": 0, "speed/wps": 5531.187444387715, "speed/FLOPS": 244450173858125.66, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 189.69, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04102454334497452, "optim/lr": 2.9495176660677692e-05, "optim/total_tokens": 1935134425088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2909272909164429, "created_at": "2025-06-03T04:06:36.649403+00:00"} {"global_step": 230687, "acc_step": 0, "speed/wps": 5531.872059485254, "speed/FLOPS": 244480430341259.12, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041370660066604614, "optim/lr": 2.9491629435583366e-05, "optim/total_tokens": 1935142813696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3019912242889404, "created_at": "2025-06-03T04:06:39.619260+00:00"} {"global_step": 230688, "acc_step": 0, "speed/wps": 5536.5058972646575, "speed/FLOPS": 244685222252976.94, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 189.57, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04108982905745506, "optim/lr": 2.948808221048882e-05, "optim/total_tokens": 1935151202304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2990834712982178, "created_at": "2025-06-03T04:06:42.582916+00:00"} {"global_step": 230689, "acc_step": 0, "speed/wps": 5516.779729968055, "speed/FLOPS": 243813426626144.25, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04382946342229843, "optim/lr": 2.9484534985394273e-05, "optim/total_tokens": 1935159590912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3180421590805054, "created_at": "2025-06-03T04:06:45.556848+00:00"} {"global_step": 230690, "acc_step": 0, "speed/wps": 5512.984724342736, "speed/FLOPS": 243645706802104.8, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.86 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.86, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04329600930213928, "optim/lr": 2.9480987760299727e-05, "optim/total_tokens": 1935167979520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3014558553695679, "created_at": "2025-06-03T04:06:48.534627+00:00"} {"global_step": 230691, "acc_step": 0, "speed/wps": 5515.6330696837795, "speed/FLOPS": 243762750110718.66, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04098959267139435, "optim/lr": 2.94774405352054e-05, "optim/total_tokens": 1935176368128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.305344820022583, "created_at": "2025-06-03T04:06:51.513698+00:00"} {"global_step": 230692, "acc_step": 0, "speed/wps": 5534.872659071571, "speed/FLOPS": 244613041484513.4, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 189.57, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04236286133527756, "optim/lr": 2.9473893310110854e-05, "optim/total_tokens": 1935184756736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2943446636199951, "created_at": "2025-06-03T04:06:54.477726+00:00"} {"global_step": 230693, "acc_step": 0, "speed/wps": 5534.868975168469, "speed/FLOPS": 244612878674852.2, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 189.64, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04059655964374542, "optim/lr": 2.9470346085016308e-05, "optim/total_tokens": 1935193145344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2955834865570068, "created_at": "2025-06-03T04:06:57.445103+00:00"} {"global_step": 230694, "acc_step": 0, "speed/wps": 5530.23682501049, "speed/FLOPS": 244408161347363.38, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 189.8, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041141048073768616, "optim/lr": 2.946679885992176e-05, "optim/total_tokens": 1935201533952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2952404022216797, "created_at": "2025-06-03T04:07:00.411981+00:00"} {"global_step": 230695, "acc_step": 0, "speed/wps": 5528.7457561120345, "speed/FLOPS": 244342263734034.12, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04138198494911194, "optim/lr": 2.946325163482744e-05, "optim/total_tokens": 1935209922560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2975741624832153, "created_at": "2025-06-03T04:07:03.381812+00:00"} {"global_step": 230696, "acc_step": 0, "speed/wps": 5519.501880638408, "speed/FLOPS": 243933731752543.66, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04164540022611618, "optim/lr": 2.945970440973289e-05, "optim/total_tokens": 1935218311168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3149261474609375, "created_at": "2025-06-03T04:07:06.354145+00:00"} {"global_step": 230697, "acc_step": 0, "speed/wps": 5521.971117883956, "speed/FLOPS": 244042859400094.94, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04133075848221779, "optim/lr": 2.9456157184638342e-05, "optim/total_tokens": 1935226699776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.279555082321167, "created_at": "2025-06-03T04:07:09.325317+00:00"} {"global_step": 230698, "acc_step": 0, "speed/wps": 5521.629825596452, "speed/FLOPS": 244027776027879.53, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.041529785841703415, "optim/lr": 2.9452609959543796e-05, "optim/total_tokens": 1935235088384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3035767078399658, "created_at": "2025-06-03T04:07:12.296445+00:00"} {"global_step": 230699, "acc_step": 0, "speed/wps": 5513.711376954113, "speed/FLOPS": 243677821128182.47, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.85 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.85, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.042403049767017365, "optim/lr": 2.9449062734449473e-05, "optim/total_tokens": 1935243476992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3127467632293701, "created_at": "2025-06-03T04:07:15.272940+00:00"} {"global_step": 230700, "acc_step": 0, "speed/wps": 5537.538844003297, "speed/FLOPS": 244730873211724.06, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.55, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04499228298664093, "optim/lr": 2.9445515509354927e-05, "optim/total_tokens": 1935251865600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.303449034690857, "created_at": "2025-06-03T04:07:18.236145+00:00"} {"global_step": 230701, "acc_step": 0, "speed/wps": 5518.932684477514, "speed/FLOPS": 243908576195642.22, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.04129888117313385, "optim/lr": 2.9441968284260377e-05, "optim/total_tokens": 1935260254208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.309970736503601, "created_at": "2025-06-03T04:07:21.208930+00:00"} {"global_step": 230702, "acc_step": 0, "speed/wps": 5515.903013152478, "speed/FLOPS": 243774680230339.22, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.29, "optim/grad_norm": 0.046484414488077164, "optim/lr": 2.943842105916583e-05, "optim/total_tokens": 1935268642816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3080072402954102, "created_at": "2025-06-03T04:07:24.183932+00:00"} {"global_step": 230703, "acc_step": 0, "speed/wps": 5521.1798624964795, "speed/FLOPS": 244007889961980.7, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04885769262909889, "optim/lr": 2.9434873834071508e-05, "optim/total_tokens": 1935277031424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3022630214691162, "created_at": "2025-06-03T04:07:27.155643+00:00"} {"global_step": 230704, "acc_step": 0, "speed/wps": 5522.795714981112, "speed/FLOPS": 244079302371118.66, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05036690831184387, "optim/lr": 2.943132660897696e-05, "optim/total_tokens": 1935285420032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2999281883239746, "created_at": "2025-06-03T04:07:30.129255+00:00"} {"global_step": 230705, "acc_step": 0, "speed/wps": 5525.825250582333, "speed/FLOPS": 244213192338123.72, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04207047075033188, "optim/lr": 2.9427779383882415e-05, "optim/total_tokens": 1935293808640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.300639271736145, "created_at": "2025-06-03T04:07:33.101297+00:00"} {"global_step": 230706, "acc_step": 0, "speed/wps": 5516.027864370966, "speed/FLOPS": 243780198015149.94, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.84 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.84, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04681781306862831, "optim/lr": 2.942423215878809e-05, "optim/total_tokens": 1935302197248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3011661767959595, "created_at": "2025-06-03T04:07:36.076636+00:00"} {"global_step": 230707, "acc_step": 0, "speed/wps": 5538.794566549485, "speed/FLOPS": 244786369720894.97, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.51, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0446016788482666, "optim/lr": 2.9420684933693543e-05, "optim/total_tokens": 1935310585856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3099827766418457, "created_at": "2025-06-03T04:07:39.042503+00:00"} {"global_step": 230708, "acc_step": 0, "speed/wps": 5533.850932227432, "speed/FLOPS": 244567886387674.53, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04255073890089989, "optim/lr": 2.9417137708598996e-05, "optim/total_tokens": 1935318974464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3139097690582275, "created_at": "2025-06-03T04:07:42.008122+00:00"} {"global_step": 230709, "acc_step": 0, "speed/wps": 5528.899978326357, "speed/FLOPS": 244349079566526.3, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.8, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.040876202285289764, "optim/lr": 2.941359048350445e-05, "optim/total_tokens": 1935327363072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.305175542831421, "created_at": "2025-06-03T04:07:44.975174+00:00"} {"global_step": 230710, "acc_step": 0, "speed/wps": 5527.443602257013, "speed/FLOPS": 244284715198669.78, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04576089233160019, "optim/lr": 2.9410043258410124e-05, "optim/total_tokens": 1935335751680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2893757820129395, "created_at": "2025-06-03T04:07:47.943326+00:00"} {"global_step": 230711, "acc_step": 0, "speed/wps": 5522.38292149583, "speed/FLOPS": 244061059011937.78, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04735945165157318, "optim/lr": 2.9406496033315577e-05, "optim/total_tokens": 1935344140288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2939889430999756, "created_at": "2025-06-03T04:07:50.915871+00:00"} {"global_step": 230712, "acc_step": 0, "speed/wps": 5531.897920753379, "speed/FLOPS": 244481573276940.3, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.75, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04153655841946602, "optim/lr": 2.940294880822103e-05, "optim/total_tokens": 1935352528896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.3056384325027466, "created_at": "2025-06-03T04:07:53.883386+00:00"} {"global_step": 230713, "acc_step": 0, "speed/wps": 5517.979912673098, "speed/FLOPS": 243866468558615.2, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0439034141600132, "optim/lr": 2.9399401583126484e-05, "optim/total_tokens": 1935360917504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3068889379501343, "created_at": "2025-06-03T04:07:56.858305+00:00"} {"global_step": 230714, "acc_step": 0, "speed/wps": 5529.874806307993, "speed/FLOPS": 244392161973692.7, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04074237123131752, "optim/lr": 2.939585435803216e-05, "optim/total_tokens": 1935369306112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.283997654914856, "created_at": "2025-06-03T04:07:59.829375+00:00"} {"global_step": 230715, "acc_step": 0, "speed/wps": 5525.161585876128, "speed/FLOPS": 244183861755053.38, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04484361410140991, "optim/lr": 2.9392307132937612e-05, "optim/total_tokens": 1935377694720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2939598560333252, "created_at": "2025-06-03T04:08:02.799712+00:00"} {"global_step": 230716, "acc_step": 0, "speed/wps": 5523.509664641951, "speed/FLOPS": 244110855291802.1, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041456855833530426, "optim/lr": 2.9388759907843066e-05, "optim/total_tokens": 1935386083328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2988585233688354, "created_at": "2025-06-03T04:08:05.772726+00:00"} {"global_step": 230717, "acc_step": 0, "speed/wps": 5524.733564349923, "speed/FLOPS": 244164945394407.88, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04643705114722252, "optim/lr": 2.938521268274852e-05, "optim/total_tokens": 1935394471936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2980310916900635, "created_at": "2025-06-03T04:08:08.741926+00:00"} {"global_step": 230718, "acc_step": 0, "speed/wps": 5527.463217666639, "speed/FLOPS": 244285582099374.5, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04817634075880051, "optim/lr": 2.9381665457654193e-05, "optim/total_tokens": 1935402860544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2940958738327026, "created_at": "2025-06-03T04:08:11.709919+00:00"} {"global_step": 230719, "acc_step": 0, "speed/wps": 5527.445071519226, "speed/FLOPS": 244284780132539.25, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04258313775062561, "optim/lr": 2.9378118232559647e-05, "optim/total_tokens": 1935411249152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3181616067886353, "created_at": "2025-06-03T04:08:14.677819+00:00"} {"global_step": 230720, "acc_step": 0, "speed/wps": 5530.064773809284, "speed/FLOPS": 244400557564907.94, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.82, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.050979889929294586, "optim/lr": 2.93745710074651e-05, "optim/total_tokens": 1935419637760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3014801740646362, "created_at": "2025-06-03T04:08:17.645245+00:00"} {"global_step": 230721, "acc_step": 0, "speed/wps": 5525.598953736641, "speed/FLOPS": 244203191175836.4, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05471978336572647, "optim/lr": 2.9371023782370554e-05, "optim/total_tokens": 1935428026368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.288804054260254, "created_at": "2025-06-03T04:08:20.614053+00:00"} {"global_step": 230722, "acc_step": 0, "speed/wps": 5547.383056274865, "speed/FLOPS": 245165937006881.28, "speed/curr_iter_time": 2.9526, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9526, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 189.23, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.048484910279512405, "optim/lr": 2.9367476557276228e-05, "optim/total_tokens": 1935436414976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.307782530784607, "created_at": "2025-06-03T04:08:23.571600+00:00"} {"global_step": 230723, "acc_step": 0, "speed/wps": 5508.54490328617, "speed/FLOPS": 243449489436468.84, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04782840609550476, "optim/lr": 2.936392933218168e-05, "optim/total_tokens": 1935444803584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2994827032089233, "created_at": "2025-06-03T04:08:26.549892+00:00"} {"global_step": 230724, "acc_step": 0, "speed/wps": 5518.012814022065, "speed/FLOPS": 243867922629835.16, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.82 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.82, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.044164981693029404, "optim/lr": 2.9360382107087135e-05, "optim/total_tokens": 1935453192192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2872523069381714, "created_at": "2025-06-03T04:08:29.525914+00:00"} {"global_step": 230725, "acc_step": 0, "speed/wps": 5526.308217270068, "speed/FLOPS": 244234536993674.0, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04214559867978096, "optim/lr": 2.935683488199259e-05, "optim/total_tokens": 1935461580800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2876991033554077, "created_at": "2025-06-03T04:08:32.500058+00:00"} {"global_step": 230726, "acc_step": 0, "speed/wps": 5528.211710891785, "speed/FLOPS": 244318661668790.3, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.83, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04936182498931885, "optim/lr": 2.9353287656898266e-05, "optim/total_tokens": 1935469969408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3117115497589111, "created_at": "2025-06-03T04:08:35.467785+00:00"} {"global_step": 230727, "acc_step": 0, "speed/wps": 5528.181512026881, "speed/FLOPS": 244317327033533.38, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.045584384351968765, "optim/lr": 2.9349740431803716e-05, "optim/total_tokens": 1935478358016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2890844345092773, "created_at": "2025-06-03T04:08:38.435930+00:00"} {"global_step": 230728, "acc_step": 0, "speed/wps": 5526.898829442972, "speed/FLOPS": 244260639028689.22, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.045657120645046234, "optim/lr": 2.934619320670917e-05, "optim/total_tokens": 1935486746624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3028345108032227, "created_at": "2025-06-03T04:08:41.405413+00:00"} {"global_step": 230729, "acc_step": 0, "speed/wps": 5526.882614363953, "speed/FLOPS": 244259922405192.84, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05174031853675842, "optim/lr": 2.9342645981614623e-05, "optim/total_tokens": 1935495135232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3087489604949951, "created_at": "2025-06-03T04:08:44.379829+00:00"} {"global_step": 230730, "acc_step": 0, "speed/wps": 5530.119484999923, "speed/FLOPS": 244402975519496.9, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.040552958846092224, "optim/lr": 2.93390987565203e-05, "optim/total_tokens": 1935503523840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2980444431304932, "created_at": "2025-06-03T04:08:47.347310+00:00"} {"global_step": 230731, "acc_step": 0, "speed/wps": 5524.317701632731, "speed/FLOPS": 244146566390886.34, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04581081122159958, "optim/lr": 2.9335551531425754e-05, "optim/total_tokens": 1935511912448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.30784010887146, "created_at": "2025-06-03T04:08:50.317059+00:00"} {"global_step": 230732, "acc_step": 0, "speed/wps": 5507.038516872969, "speed/FLOPS": 243382914867390.0, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.83 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.83, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04177000746130943, "optim/lr": 2.9332004306331208e-05, "optim/total_tokens": 1935520301056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3059906959533691, "created_at": "2025-06-03T04:08:53.296139+00:00"} {"global_step": 230733, "acc_step": 0, "speed/wps": 5519.68293582721, "speed/FLOPS": 243941733465164.22, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04240860417485237, "optim/lr": 2.932845708123688e-05, "optim/total_tokens": 1935528689664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3095499277114868, "created_at": "2025-06-03T04:08:56.268054+00:00"} {"global_step": 230734, "acc_step": 0, "speed/wps": 5539.939557692987, "speed/FLOPS": 244836972468841.8, "speed/curr_iter_time": 2.9566, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9566, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 189.5, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0419314019382, "optim/lr": 2.9324909856142335e-05, "optim/total_tokens": 1935537078272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.306201696395874, "created_at": "2025-06-03T04:08:59.229227+00:00"} {"global_step": 230735, "acc_step": 0, "speed/wps": 5536.279051902948, "speed/FLOPS": 244675196849089.16, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04209818318486214, "optim/lr": 2.932136263104779e-05, "optim/total_tokens": 1935545466880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3078603744506836, "created_at": "2025-06-03T04:09:02.192428+00:00"} {"global_step": 230736, "acc_step": 0, "speed/wps": 5518.153054375396, "speed/FLOPS": 243874120535637.2, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04121354967355728, "optim/lr": 2.9317815405953242e-05, "optim/total_tokens": 1935553855488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2958348989486694, "created_at": "2025-06-03T04:09:05.165160+00:00"} {"global_step": 230737, "acc_step": 0, "speed/wps": 5522.575194393876, "speed/FLOPS": 244069556489889.5, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04149593040347099, "optim/lr": 2.9314268180858916e-05, "optim/total_tokens": 1935562244096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.302865982055664, "created_at": "2025-06-03T04:09:08.135878+00:00"} {"global_step": 230738, "acc_step": 0, "speed/wps": 5538.068998080299, "speed/FLOPS": 244754303308353.03, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 189.56, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041631437838077545, "optim/lr": 2.931072095576437e-05, "optim/total_tokens": 1935570632704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.3090732097625732, "created_at": "2025-06-03T04:09:11.098250+00:00"} {"global_step": 230739, "acc_step": 0, "speed/wps": 5515.949310630921, "speed/FLOPS": 243776726341914.4, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04138345643877983, "optim/lr": 2.9307173730669823e-05, "optim/total_tokens": 1935579021312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3080406188964844, "created_at": "2025-06-03T04:09:14.073195+00:00"} {"global_step": 230740, "acc_step": 0, "speed/wps": 5531.5755923769675, "speed/FLOPS": 244467328012529.1, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04117433726787567, "optim/lr": 2.9303626505575277e-05, "optim/total_tokens": 1935587409920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.302101492881775, "created_at": "2025-06-03T04:09:17.038484+00:00"} {"global_step": 230741, "acc_step": 0, "speed/wps": 5518.496430106822, "speed/FLOPS": 243889295985409.9, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.1198476254940033, "optim/lr": 2.930007928048095e-05, "optim/total_tokens": 1935595798528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.315667986869812, "created_at": "2025-06-03T04:09:20.011270+00:00"} {"global_step": 230742, "acc_step": 0, "speed/wps": 5540.662226690833, "speed/FLOPS": 244868910739591.38, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 189.48, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04197956621646881, "optim/lr": 2.9296532055386404e-05, "optim/total_tokens": 1935604187136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3091964721679688, "created_at": "2025-06-03T04:09:22.973207+00:00"} {"global_step": 230743, "acc_step": 0, "speed/wps": 5536.865458032775, "speed/FLOPS": 244701112998528.88, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 189.56, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04158570244908333, "optim/lr": 2.9292984830291858e-05, "optim/total_tokens": 1935612575744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.319032073020935, "created_at": "2025-06-03T04:09:25.937099+00:00"} {"global_step": 230744, "acc_step": 0, "speed/wps": 5527.05820971135, "speed/FLOPS": 244267682820769.38, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04124496877193451, "optim/lr": 2.928943760519731e-05, "optim/total_tokens": 1935620964352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3007467985153198, "created_at": "2025-06-03T04:09:28.905634+00:00"} {"global_step": 230745, "acc_step": 0, "speed/wps": 5528.167005744744, "speed/FLOPS": 244316685930112.78, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04168397933244705, "optim/lr": 2.9285890380102985e-05, "optim/total_tokens": 1935629352960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3180381059646606, "created_at": "2025-06-03T04:09:31.873268+00:00"} {"global_step": 230746, "acc_step": 0, "speed/wps": 5525.633360503068, "speed/FLOPS": 244204711778802.66, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04152638837695122, "optim/lr": 2.928234315500844e-05, "optim/total_tokens": 1935637741568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.312508463859558, "created_at": "2025-06-03T04:09:34.841945+00:00"} {"global_step": 230747, "acc_step": 0, "speed/wps": 5524.663262929687, "speed/FLOPS": 244161838431468.75, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04106098413467407, "optim/lr": 2.9278795929913893e-05, "optim/total_tokens": 1935646130176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2895509004592896, "created_at": "2025-06-03T04:09:37.815088+00:00"} {"global_step": 230748, "acc_step": 0, "speed/wps": 5521.176401699373, "speed/FLOPS": 244007737012462.53, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04190957546234131, "optim/lr": 2.9275248704819346e-05, "optim/total_tokens": 1935654518784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2970762252807617, "created_at": "2025-06-03T04:09:40.787008+00:00"} {"global_step": 230749, "acc_step": 0, "speed/wps": 5510.802873975537, "speed/FLOPS": 243549280183597.22, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.81 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.81, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042853374034166336, "optim/lr": 2.927170147972502e-05, "optim/total_tokens": 1935662907392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3063867092132568, "created_at": "2025-06-03T04:09:43.763825+00:00"} {"global_step": 230750, "acc_step": 0, "speed/wps": 5520.776870162844, "speed/FLOPS": 243990079763535.75, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0421440452337265, "optim/lr": 2.9268154254630474e-05, "optim/total_tokens": 1935671296000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.314139485359192, "created_at": "2025-06-03T04:09:46.740959+00:00"} {"global_step": 230751, "acc_step": 0, "speed/wps": 5522.97668073031, "speed/FLOPS": 244087300130966.56, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04218903183937073, "optim/lr": 2.9264607029535927e-05, "optim/total_tokens": 1935679684608, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.321502447128296, "created_at": "2025-06-03T04:09:49.711130+00:00"} {"global_step": 230752, "acc_step": 0, "speed/wps": 5522.251267666702, "speed/FLOPS": 244055240586555.72, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04395674541592598, "optim/lr": 2.926105980444138e-05, "optim/total_tokens": 1935688073216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2995589971542358, "created_at": "2025-06-03T04:09:52.681911+00:00"} {"global_step": 230753, "acc_step": 0, "speed/wps": 5519.840284287117, "speed/FLOPS": 243948687461709.72, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04135631397366524, "optim/lr": 2.9257512579347058e-05, "optim/total_tokens": 1935696461824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.298237919807434, "created_at": "2025-06-03T04:09:55.657756+00:00"} {"global_step": 230754, "acc_step": 0, "speed/wps": 5525.206900110497, "speed/FLOPS": 244185864412273.22, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04242810606956482, "optim/lr": 2.9253965354252508e-05, "optim/total_tokens": 1935704850432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2988590002059937, "created_at": "2025-06-03T04:09:58.627220+00:00"} {"global_step": 230755, "acc_step": 0, "speed/wps": 5522.098942362565, "speed/FLOPS": 244048508587784.47, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04175858944654465, "optim/lr": 2.9250418129157962e-05, "optim/total_tokens": 1935713239040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2896173000335693, "created_at": "2025-06-03T04:10:01.598764+00:00"} {"global_step": 230756, "acc_step": 0, "speed/wps": 5522.365482164272, "speed/FLOPS": 244060288282745.53, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04122031107544899, "optim/lr": 2.9246870904063415e-05, "optim/total_tokens": 1935721627648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3145840167999268, "created_at": "2025-06-03T04:10:04.569333+00:00"} {"global_step": 230757, "acc_step": 0, "speed/wps": 5525.847037165628, "speed/FLOPS": 244214155193591.5, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04039353132247925, "optim/lr": 2.9243323678969093e-05, "optim/total_tokens": 1935730016256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3203670978546143, "created_at": "2025-06-03T04:10:07.537992+00:00"} {"global_step": 230758, "acc_step": 0, "speed/wps": 5523.685669227155, "speed/FLOPS": 244118633793595.0, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04132729396224022, "optim/lr": 2.9239776453874546e-05, "optim/total_tokens": 1935738404864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3096569776535034, "created_at": "2025-06-03T04:10:10.507850+00:00"} {"global_step": 230759, "acc_step": 0, "speed/wps": 5520.50725846251, "speed/FLOPS": 243978164306378.78, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041189517825841904, "optim/lr": 2.9236229228779996e-05, "optim/total_tokens": 1935746793472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3002686500549316, "created_at": "2025-06-03T04:10:13.479871+00:00"} {"global_step": 230760, "acc_step": 0, "speed/wps": 5521.639963610062, "speed/FLOPS": 244028224076190.06, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04243803024291992, "optim/lr": 2.9232682003685674e-05, "optim/total_tokens": 1935755182080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.293179988861084, "created_at": "2025-06-03T04:10:16.450823+00:00"} {"global_step": 230761, "acc_step": 0, "speed/wps": 5523.71013545397, "speed/FLOPS": 244119715075590.72, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04148371145129204, "optim/lr": 2.9229134778591127e-05, "optim/total_tokens": 1935763570688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2974239587783813, "created_at": "2025-06-03T04:10:19.420560+00:00"} {"global_step": 230762, "acc_step": 0, "speed/wps": 5530.323045863649, "speed/FLOPS": 244411971867754.66, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04291403293609619, "optim/lr": 2.922558755349658e-05, "optim/total_tokens": 1935771959296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.302769660949707, "created_at": "2025-06-03T04:10:22.390223+00:00"} {"global_step": 230763, "acc_step": 0, "speed/wps": 5514.6706876408, "speed/FLOPS": 243720217750336.8, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04845161363482475, "optim/lr": 2.9222040328402035e-05, "optim/total_tokens": 1935780347904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2980657815933228, "created_at": "2025-06-03T04:10:25.367306+00:00"} {"global_step": 230764, "acc_step": 0, "speed/wps": 5524.096940666841, "speed/FLOPS": 244136809886151.06, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04324134439229965, "optim/lr": 2.921849310330771e-05, "optim/total_tokens": 1935788736512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3027029037475586, "created_at": "2025-06-03T04:10:28.336931+00:00"} {"global_step": 230765, "acc_step": 0, "speed/wps": 5519.334974272435, "speed/FLOPS": 243926355345471.88, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.23, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041377365589141846, "optim/lr": 2.9214945878213162e-05, "optim/total_tokens": 1935797125120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2943339347839355, "created_at": "2025-06-03T04:10:31.312943+00:00"} {"global_step": 230766, "acc_step": 0, "speed/wps": 5506.831128385889, "speed/FLOPS": 243373749357771.6, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.8 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.8, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04249123856425285, "optim/lr": 2.9211398653118616e-05, "optim/total_tokens": 1935805513728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2938190698623657, "created_at": "2025-06-03T04:10:34.294813+00:00"} {"global_step": 230767, "acc_step": 0, "speed/wps": 5528.260544850403, "speed/FLOPS": 244320819879806.38, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04077288880944252, "optim/lr": 2.920785142802407e-05, "optim/total_tokens": 1935813902336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2944490909576416, "created_at": "2025-06-03T04:10:37.267435+00:00"} {"global_step": 230768, "acc_step": 0, "speed/wps": 5528.539524110667, "speed/FLOPS": 244333149335164.75, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04260080307722092, "optim/lr": 2.9204304202929743e-05, "optim/total_tokens": 1935822290944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3005329370498657, "created_at": "2025-06-03T04:10:40.234569+00:00"} {"global_step": 230769, "acc_step": 0, "speed/wps": 5524.7019486803965, "speed/FLOPS": 244163548143638.47, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041852664202451706, "optim/lr": 2.9200756977835197e-05, "optim/total_tokens": 1935830679552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3043112754821777, "created_at": "2025-06-03T04:10:43.204153+00:00"} {"global_step": 230770, "acc_step": 0, "speed/wps": 5527.343886593308, "speed/FLOPS": 244280308276725.06, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041383594274520874, "optim/lr": 2.919720975274065e-05, "optim/total_tokens": 1935839068160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3041547536849976, "created_at": "2025-06-03T04:10:46.175907+00:00"} {"global_step": 230771, "acc_step": 0, "speed/wps": 5514.806060189143, "speed/FLOPS": 243726200524074.06, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0431344211101532, "optim/lr": 2.9193662527646104e-05, "optim/total_tokens": 1935847456768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3064262866973877, "created_at": "2025-06-03T04:10:49.153860+00:00"} {"global_step": 230772, "acc_step": 0, "speed/wps": 5513.697807101701, "speed/FLOPS": 243677221410162.66, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04375009983778, "optim/lr": 2.9190115302551778e-05, "optim/total_tokens": 1935855845376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.304029107093811, "created_at": "2025-06-03T04:10:52.132767+00:00"} {"global_step": 230773, "acc_step": 0, "speed/wps": 5520.768346565126, "speed/FLOPS": 243989703064144.34, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04034187272191048, "optim/lr": 2.918656807745723e-05, "optim/total_tokens": 1935864233984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2987287044525146, "created_at": "2025-06-03T04:10:55.105212+00:00"} {"global_step": 230774, "acc_step": 0, "speed/wps": 5520.267073726454, "speed/FLOPS": 243967549370422.03, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041325557976961136, "optim/lr": 2.9183020852362685e-05, "optim/total_tokens": 1935872622592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.303636074066162, "created_at": "2025-06-03T04:10:58.080590+00:00"} {"global_step": 230775, "acc_step": 0, "speed/wps": 5521.462589488777, "speed/FLOPS": 244020385047912.28, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04445240646600723, "optim/lr": 2.917947362726814e-05, "optim/total_tokens": 1935881011200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2848707437515259, "created_at": "2025-06-03T04:11:01.055561+00:00"} {"global_step": 230776, "acc_step": 0, "speed/wps": 5526.96703244232, "speed/FLOPS": 244263653252165.78, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04076582193374634, "optim/lr": 2.9175926402173812e-05, "optim/total_tokens": 1935889399808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2987534999847412, "created_at": "2025-06-03T04:11:04.024214+00:00"} {"global_step": 230777, "acc_step": 0, "speed/wps": 5526.67314522839, "speed/FLOPS": 244250664941561.22, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04423220455646515, "optim/lr": 2.9172379177079266e-05, "optim/total_tokens": 1935897788416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3106900453567505, "created_at": "2025-06-03T04:11:06.992849+00:00"} {"global_step": 230778, "acc_step": 0, "speed/wps": 5521.951088618858, "speed/FLOPS": 244041974209096.7, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04911863058805466, "optim/lr": 2.916883195198472e-05, "optim/total_tokens": 1935906177024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3045705556869507, "created_at": "2025-06-03T04:11:09.963995+00:00"} {"global_step": 230779, "acc_step": 0, "speed/wps": 5516.417238180586, "speed/FLOPS": 243797406344539.28, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04541519284248352, "optim/lr": 2.9165284726890173e-05, "optim/total_tokens": 1935914565632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2983405590057373, "created_at": "2025-06-03T04:11:12.940950+00:00"} {"global_step": 230780, "acc_step": 0, "speed/wps": 5511.789832132586, "speed/FLOPS": 243592898682428.94, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.44, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04557747766375542, "optim/lr": 2.9161737501795847e-05, "optim/total_tokens": 1935922954240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3050428628921509, "created_at": "2025-06-03T04:11:15.920947+00:00"} {"global_step": 230781, "acc_step": 0, "speed/wps": 5516.0191582629595, "speed/FLOPS": 243779813249737.94, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041480302810668945, "optim/lr": 2.91581902767013e-05, "optim/total_tokens": 1935931342848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2973021268844604, "created_at": "2025-06-03T04:11:18.897739+00:00"} {"global_step": 230782, "acc_step": 0, "speed/wps": 5515.323819893603, "speed/FLOPS": 243749082852876.8, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05148496478796005, "optim/lr": 2.9154643051606754e-05, "optim/total_tokens": 1935939731456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2930830717086792, "created_at": "2025-06-03T04:11:21.873889+00:00"} {"global_step": 230783, "acc_step": 0, "speed/wps": 5514.80753613869, "speed/FLOPS": 243726265753489.44, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.047354113310575485, "optim/lr": 2.9151095826512208e-05, "optim/total_tokens": 1935948120064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3253285884857178, "created_at": "2025-06-03T04:11:24.851034+00:00"} {"global_step": 230784, "acc_step": 0, "speed/wps": 5528.030887439093, "speed/FLOPS": 244310670197719.66, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04727835953235626, "optim/lr": 2.9147548601417885e-05, "optim/total_tokens": 1935956508672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2996410131454468, "created_at": "2025-06-03T04:11:27.818621+00:00"} {"global_step": 230785, "acc_step": 0, "speed/wps": 5525.315674572661, "speed/FLOPS": 244190671686742.7, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.057442136108875275, "optim/lr": 2.9144001376323335e-05, "optim/total_tokens": 1935964897280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2883332967758179, "created_at": "2025-06-03T04:11:30.788103+00:00"} {"global_step": 230786, "acc_step": 0, "speed/wps": 5512.913352485966, "speed/FLOPS": 243642552531349.88, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041718702763319016, "optim/lr": 2.914045415122879e-05, "optim/total_tokens": 1935973285888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3033554553985596, "created_at": "2025-06-03T04:11:33.764258+00:00"} {"global_step": 230787, "acc_step": 0, "speed/wps": 5518.148722411742, "speed/FLOPS": 243873929085016.7, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 190.23, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.056416019797325134, "optim/lr": 2.9136906926134466e-05, "optim/total_tokens": 1935981674496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3033543825149536, "created_at": "2025-06-03T04:11:36.737407+00:00"} {"global_step": 230788, "acc_step": 0, "speed/wps": 5509.278890410045, "speed/FLOPS": 243481927910457.47, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04352680221199989, "optim/lr": 2.913335970103992e-05, "optim/total_tokens": 1935990063104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2978426218032837, "created_at": "2025-06-03T04:11:39.719148+00:00"} {"global_step": 230789, "acc_step": 0, "speed/wps": 5528.160007127078, "speed/FLOPS": 244316376627034.12, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.050910841673612595, "optim/lr": 2.9129812475945373e-05, "optim/total_tokens": 1935998451712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2945135831832886, "created_at": "2025-06-03T04:11:42.690392+00:00"} {"global_step": 230790, "acc_step": 0, "speed/wps": 5502.651028551291, "speed/FLOPS": 243189010340772.88, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.79 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.79, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04591231048107147, "optim/lr": 2.9126265250850827e-05, "optim/total_tokens": 1936006840320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3024165630340576, "created_at": "2025-06-03T04:11:45.675811+00:00"} {"global_step": 230791, "acc_step": 0, "speed/wps": 5516.56714188383, "speed/FLOPS": 243804031320945.97, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04623491317033768, "optim/lr": 2.91227180257565e-05, "optim/total_tokens": 1936015228928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3014743328094482, "created_at": "2025-06-03T04:11:48.649344+00:00"} {"global_step": 230792, "acc_step": 0, "speed/wps": 5527.445236073169, "speed/FLOPS": 244284787404981.28, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.046989716589450836, "optim/lr": 2.9119170800661954e-05, "optim/total_tokens": 1936023617536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3003324270248413, "created_at": "2025-06-03T04:11:51.620994+00:00"} {"global_step": 230793, "acc_step": 0, "speed/wps": 5523.799319107233, "speed/FLOPS": 244123656536581.62, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04743366688489914, "optim/lr": 2.9115623575567408e-05, "optim/total_tokens": 1936032006144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3027700185775757, "created_at": "2025-06-03T04:11:54.595667+00:00"} {"global_step": 230794, "acc_step": 0, "speed/wps": 5526.743613272188, "speed/FLOPS": 244253779268408.94, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 189.93, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04255412891507149, "optim/lr": 2.911207635047286e-05, "optim/total_tokens": 1936040394752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3078274726867676, "created_at": "2025-06-03T04:11:57.564636+00:00"} {"global_step": 230795, "acc_step": 0, "speed/wps": 5524.16896536885, "speed/FLOPS": 244139993009324.0, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04423626884818077, "optim/lr": 2.9108529125378535e-05, "optim/total_tokens": 1936048783360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3204634189605713, "created_at": "2025-06-03T04:12:00.534375+00:00"} {"global_step": 230796, "acc_step": 0, "speed/wps": 5529.773394220964, "speed/FLOPS": 244387680078520.16, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04252787306904793, "optim/lr": 2.910498190028399e-05, "optim/total_tokens": 1936057171968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.295932650566101, "created_at": "2025-06-03T04:12:03.501326+00:00"} {"global_step": 230797, "acc_step": 0, "speed/wps": 5527.701213546867, "speed/FLOPS": 244296100299107.22, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04257464408874512, "optim/lr": 2.9101434675189443e-05, "optim/total_tokens": 1936065560576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.303225040435791, "created_at": "2025-06-03T04:12:06.469108+00:00"} {"global_step": 230798, "acc_step": 0, "speed/wps": 5516.269645720498, "speed/FLOPS": 243790883513250.12, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04354948550462723, "optim/lr": 2.9097887450094896e-05, "optim/total_tokens": 1936073949184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3232461214065552, "created_at": "2025-06-03T04:12:09.443512+00:00"} {"global_step": 230799, "acc_step": 0, "speed/wps": 5512.258867752809, "speed/FLOPS": 243613627656100.9, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.77 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.77, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.049652405083179474, "optim/lr": 2.909434022500057e-05, "optim/total_tokens": 1936082337792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3080945014953613, "created_at": "2025-06-03T04:12:12.423369+00:00"} {"global_step": 230800, "acc_step": 0, "speed/wps": 5501.6841871107945, "speed/FLOPS": 243146280897846.03, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.78 hours", "speed/est_time_elapsed_hrs": 190.82, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.78, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042119864374399185, "optim/lr": 2.9090792999906024e-05, "optim/total_tokens": 1936090726400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3099008798599243, "created_at": "2025-06-03T04:12:15.406016+00:00"} {"global_step": 230801, "acc_step": 0, "speed/wps": 5533.760515503875, "speed/FLOPS": 244563890431288.03, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04929206147789955, "optim/lr": 2.9087245774811477e-05, "optim/total_tokens": 1936099115008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3011945486068726, "created_at": "2025-06-03T04:12:18.373529+00:00"} {"global_step": 230802, "acc_step": 0, "speed/wps": 5531.524917939307, "speed/FLOPS": 244465088461759.78, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04136953502893448, "optim/lr": 2.908369854971693e-05, "optim/total_tokens": 1936107503616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3110096454620361, "created_at": "2025-06-03T04:12:21.339393+00:00"} {"global_step": 230803, "acc_step": 0, "speed/wps": 5523.963030000449, "speed/FLOPS": 244130891720113.47, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.049782637506723404, "optim/lr": 2.9080151324622605e-05, "optim/total_tokens": 1936115892224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3042343854904175, "created_at": "2025-06-03T04:12:24.310157+00:00"} {"global_step": 230804, "acc_step": 0, "speed/wps": 5517.9353724231105, "speed/FLOPS": 243864500107543.4, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04171321168541908, "optim/lr": 2.9076604099528058e-05, "optim/total_tokens": 1936124280832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3013012409210205, "created_at": "2025-06-03T04:12:27.283822+00:00"} {"global_step": 230805, "acc_step": 0, "speed/wps": 5526.446061058811, "speed/FLOPS": 244240628983587.97, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05136178806424141, "optim/lr": 2.9073056874433512e-05, "optim/total_tokens": 1936132669440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.299788475036621, "created_at": "2025-06-03T04:12:30.252226+00:00"} {"global_step": 230806, "acc_step": 0, "speed/wps": 5518.719019372599, "speed/FLOPS": 243899133291642.12, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04187195375561714, "optim/lr": 2.9069509649338965e-05, "optim/total_tokens": 1936141058048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.29962956905365, "created_at": "2025-06-03T04:12:33.224445+00:00"} {"global_step": 230807, "acc_step": 0, "speed/wps": 5513.63007591669, "speed/FLOPS": 243674228038464.78, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05272900313138962, "optim/lr": 2.906596242424464e-05, "optim/total_tokens": 1936149446656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3032875061035156, "created_at": "2025-06-03T04:12:36.203263+00:00"} {"global_step": 230808, "acc_step": 0, "speed/wps": 5524.9820750106, "speed/FLOPS": 244175928293616.94, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04120345413684845, "optim/lr": 2.9062415199150093e-05, "optim/total_tokens": 1936157835264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3088781833648682, "created_at": "2025-06-03T04:12:39.172733+00:00"} {"global_step": 230809, "acc_step": 0, "speed/wps": 5534.599036169398, "speed/FLOPS": 244600948752766.3, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04806884378194809, "optim/lr": 2.9058867974055547e-05, "optim/total_tokens": 1936166223872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3079699277877808, "created_at": "2025-06-03T04:12:42.137233+00:00"} {"global_step": 230810, "acc_step": 0, "speed/wps": 5528.9457566047795, "speed/FLOPS": 244351102732118.12, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04092131182551384, "optim/lr": 2.9055320748961e-05, "optim/total_tokens": 1936174612480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3122427463531494, "created_at": "2025-06-03T04:12:45.104221+00:00"} {"global_step": 230811, "acc_step": 0, "speed/wps": 5533.385491870144, "speed/FLOPS": 244547316306222.1, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04866016283631325, "optim/lr": 2.9051773523866677e-05, "optim/total_tokens": 1936183001088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2914364337921143, "created_at": "2025-06-03T04:12:48.069186+00:00"} {"global_step": 230812, "acc_step": 0, "speed/wps": 5527.20724356614, "speed/FLOPS": 244274269354326.66, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04173131287097931, "optim/lr": 2.9048226298772128e-05, "optim/total_tokens": 1936191389696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2867871522903442, "created_at": "2025-06-03T04:12:51.037555+00:00"} {"global_step": 230813, "acc_step": 0, "speed/wps": 5516.975482781741, "speed/FLOPS": 243822077898555.47, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0539463609457016, "optim/lr": 2.904467907367758e-05, "optim/total_tokens": 1936199778304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2928893566131592, "created_at": "2025-06-03T04:12:54.014502+00:00"} {"global_step": 230814, "acc_step": 0, "speed/wps": 5510.814303233451, "speed/FLOPS": 243549785298296.75, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.044768113642930984, "optim/lr": 2.904113184858326e-05, "optim/total_tokens": 1936208166912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3050220012664795, "created_at": "2025-06-03T04:12:56.991912+00:00"} {"global_step": 230815, "acc_step": 0, "speed/wps": 5520.511016387119, "speed/FLOPS": 243978330387411.66, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.23, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04940374940633774, "optim/lr": 2.9037584623488712e-05, "optim/total_tokens": 1936216555520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.305040717124939, "created_at": "2025-06-03T04:12:59.963807+00:00"} {"global_step": 230816, "acc_step": 0, "speed/wps": 5510.219597667526, "speed/FLOPS": 243523502356261.88, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.59, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04248203709721565, "optim/lr": 2.9034037398394166e-05, "optim/total_tokens": 1936224944128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3016655445098877, "created_at": "2025-06-03T04:13:02.940980+00:00"} {"global_step": 230817, "acc_step": 0, "speed/wps": 5516.8160368689105, "speed/FLOPS": 243815031205326.5, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.050578951835632324, "optim/lr": 2.9030490173299616e-05, "optim/total_tokens": 1936233332736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3097976446151733, "created_at": "2025-06-03T04:13:05.917180+00:00"} {"global_step": 230818, "acc_step": 0, "speed/wps": 5509.398691916992, "speed/FLOPS": 243487222523864.8, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.76 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.76, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04291355237364769, "optim/lr": 2.9026942948205293e-05, "optim/total_tokens": 1936241721344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2985734939575195, "created_at": "2025-06-03T04:13:08.895321+00:00"} {"global_step": 230819, "acc_step": 0, "speed/wps": 5519.064930703842, "speed/FLOPS": 243914420801948.34, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.049429912120103836, "optim/lr": 2.9023395723110747e-05, "optim/total_tokens": 1936250109952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2879136800765991, "created_at": "2025-06-03T04:13:11.868476+00:00"} {"global_step": 230820, "acc_step": 0, "speed/wps": 5525.658816787572, "speed/FLOPS": 244205836816280.66, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04215265065431595, "optim/lr": 2.90198484980162e-05, "optim/total_tokens": 1936258498560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2876802682876587, "created_at": "2025-06-03T04:13:14.837575+00:00"} {"global_step": 230821, "acc_step": 0, "speed/wps": 5526.238930364919, "speed/FLOPS": 244231474867108.94, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.047652725130319595, "optim/lr": 2.9016301272921654e-05, "optim/total_tokens": 1936266887168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2942582368850708, "created_at": "2025-06-03T04:13:17.805910+00:00"} {"global_step": 230822, "acc_step": 0, "speed/wps": 5523.908977383203, "speed/FLOPS": 244128502871097.56, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04228532686829567, "optim/lr": 2.9012754047827328e-05, "optim/total_tokens": 1936275275776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2977420091629028, "created_at": "2025-06-03T04:13:20.775911+00:00"} {"global_step": 230823, "acc_step": 0, "speed/wps": 5520.230520021401, "speed/FLOPS": 243965933883757.5, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04777085408568382, "optim/lr": 2.900920682273278e-05, "optim/total_tokens": 1936283664384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.317299723625183, "created_at": "2025-06-03T04:13:23.750615+00:00"} {"global_step": 230824, "acc_step": 0, "speed/wps": 5521.5128635401325, "speed/FLOPS": 244022606903656.28, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04181014373898506, "optim/lr": 2.9005659597638235e-05, "optim/total_tokens": 1936292052992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3094401359558105, "created_at": "2025-06-03T04:13:26.721475+00:00"} {"global_step": 230825, "acc_step": 0, "speed/wps": 5519.62611378589, "speed/FLOPS": 243939222221779.47, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04476802423596382, "optim/lr": 2.900211237254369e-05, "optim/total_tokens": 1936300441600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3087788820266724, "created_at": "2025-06-03T04:13:29.697814+00:00"} {"global_step": 230826, "acc_step": 0, "speed/wps": 5532.185626056006, "speed/FLOPS": 244494288378707.2, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041073430329561234, "optim/lr": 2.8998565147449362e-05, "optim/total_tokens": 1936308830208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2895137071609497, "created_at": "2025-06-03T04:13:32.664763+00:00"} {"global_step": 230827, "acc_step": 0, "speed/wps": 5528.858472705365, "speed/FLOPS": 244347245230523.5, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.046488337218761444, "optim/lr": 2.8995017922354816e-05, "optim/total_tokens": 1936317218816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.283458948135376, "created_at": "2025-06-03T04:13:35.635536+00:00"} {"global_step": 230828, "acc_step": 0, "speed/wps": 5528.735651498798, "speed/FLOPS": 244341817161849.16, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04227335751056671, "optim/lr": 2.899147069726027e-05, "optim/total_tokens": 1936325607424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.3117934465408325, "created_at": "2025-06-03T04:13:38.603239+00:00"} {"global_step": 230829, "acc_step": 0, "speed/wps": 5527.913758267866, "speed/FLOPS": 244305493687872.88, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04297597333788872, "optim/lr": 2.8987923472165723e-05, "optim/total_tokens": 1936333996032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3048174381256104, "created_at": "2025-06-03T04:13:41.572803+00:00"} {"global_step": 230830, "acc_step": 0, "speed/wps": 5509.698861907285, "speed/FLOPS": 243500488501026.5, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04418734088540077, "optim/lr": 2.8984376247071397e-05, "optim/total_tokens": 1936342384640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3091390132904053, "created_at": "2025-06-03T04:13:44.550823+00:00"} {"global_step": 230831, "acc_step": 0, "speed/wps": 5500.390297579147, "speed/FLOPS": 243089097603274.2, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05069123953580856, "optim/lr": 2.898082902197685e-05, "optim/total_tokens": 1936350773248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3126779794692993, "created_at": "2025-06-03T04:13:47.533027+00:00"} {"global_step": 230832, "acc_step": 0, "speed/wps": 5515.233623293037, "speed/FLOPS": 243745096624799.84, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042667850852012634, "optim/lr": 2.8977281796882304e-05, "optim/total_tokens": 1936359161856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3069603443145752, "created_at": "2025-06-03T04:13:50.507681+00:00"} {"global_step": 230833, "acc_step": 0, "speed/wps": 5514.350864911167, "speed/FLOPS": 243706083222688.2, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.74 hours", "speed/est_time_elapsed_hrs": 190.44, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.74, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04802648723125458, "optim/lr": 2.8973734571787758e-05, "optim/total_tokens": 1936367550464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3009002208709717, "created_at": "2025-06-03T04:13:53.483254+00:00"} {"global_step": 230834, "acc_step": 0, "speed/wps": 5515.738437222394, "speed/FLOPS": 243767406816605.47, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041022852063179016, "optim/lr": 2.897018734669343e-05, "optim/total_tokens": 1936375939072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3188612461090088, "created_at": "2025-06-03T04:13:56.461766+00:00"} {"global_step": 230835, "acc_step": 0, "speed/wps": 5523.121091052563, "speed/FLOPS": 244093682328051.1, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04356412962079048, "optim/lr": 2.8966640121598885e-05, "optim/total_tokens": 1936384327680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2805737257003784, "created_at": "2025-06-03T04:13:59.436000+00:00"} {"global_step": 230836, "acc_step": 0, "speed/wps": 5525.082126703199, "speed/FLOPS": 244180350066318.8, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0404079370200634, "optim/lr": 2.896309289650434e-05, "optim/total_tokens": 1936392716288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3088384866714478, "created_at": "2025-06-03T04:14:02.410660+00:00"} {"global_step": 230837, "acc_step": 0, "speed/wps": 5529.799508332767, "speed/FLOPS": 244388834188597.7, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.046910665929317474, "optim/lr": 2.8959545671409792e-05, "optim/total_tokens": 1936401104896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3038092851638794, "created_at": "2025-06-03T04:14:05.379797+00:00"} {"global_step": 230838, "acc_step": 0, "speed/wps": 5518.598713943948, "speed/FLOPS": 243893816407474.72, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04157311096787453, "optim/lr": 2.8955998446315466e-05, "optim/total_tokens": 1936409493504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2996338605880737, "created_at": "2025-06-03T04:14:08.356442+00:00"} {"global_step": 230839, "acc_step": 0, "speed/wps": 5535.065212307574, "speed/FLOPS": 244621551351967.94, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 189.75, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.053794171661138535, "optim/lr": 2.895245122122092e-05, "optim/total_tokens": 1936417882112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2961187362670898, "created_at": "2025-06-03T04:14:11.321705+00:00"} {"global_step": 230840, "acc_step": 0, "speed/wps": 5528.892615557486, "speed/FLOPS": 244348754169828.3, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04228200390934944, "optim/lr": 2.8948903996126374e-05, "optim/total_tokens": 1936426270720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3026655912399292, "created_at": "2025-06-03T04:14:14.288992+00:00"} {"global_step": 230841, "acc_step": 0, "speed/wps": 5518.50049169913, "speed/FLOPS": 243889475487000.8, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.048928599804639816, "optim/lr": 2.894535677103205e-05, "optim/total_tokens": 1936434659328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3133175373077393, "created_at": "2025-06-03T04:14:17.266992+00:00"} {"global_step": 230842, "acc_step": 0, "speed/wps": 5500.8471486796525, "speed/FLOPS": 243109288083540.62, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.75 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.75, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04409411549568176, "optim/lr": 2.8941809545937504e-05, "optim/total_tokens": 1936443047936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.287102222442627, "created_at": "2025-06-03T04:14:20.252925+00:00"} {"global_step": 230843, "acc_step": 0, "speed/wps": 5524.519807675153, "speed/FLOPS": 244155498443488.9, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04348480701446533, "optim/lr": 2.8938262320842958e-05, "optim/total_tokens": 1936451436544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.289084553718567, "created_at": "2025-06-03T04:14:23.226085+00:00"} {"global_step": 230844, "acc_step": 0, "speed/wps": 5523.36259158335, "speed/FLOPS": 244104355415400.1, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.046098366379737854, "optim/lr": 2.8934715095748408e-05, "optim/total_tokens": 1936459825152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3082165718078613, "created_at": "2025-06-03T04:14:26.196325+00:00"} {"global_step": 230845, "acc_step": 0, "speed/wps": 5536.391162888857, "speed/FLOPS": 244680151580830.3, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 189.71, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04276403784751892, "optim/lr": 2.8931167870654085e-05, "optim/total_tokens": 1936468213760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.28782057762146, "created_at": "2025-06-03T04:14:29.159999+00:00"} {"global_step": 230846, "acc_step": 0, "speed/wps": 5520.020665825094, "speed/FLOPS": 243956659402411.84, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04350188747048378, "optim/lr": 2.892762064555954e-05, "optim/total_tokens": 1936476602368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.287894368171692, "created_at": "2025-06-03T04:14:32.132279+00:00"} {"global_step": 230847, "acc_step": 0, "speed/wps": 5514.275241118336, "speed/FLOPS": 243702741038122.72, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.42, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04404858872294426, "optim/lr": 2.8924073420464993e-05, "optim/total_tokens": 1936484990976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3038772344589233, "created_at": "2025-06-03T04:14:35.111820+00:00"} {"global_step": 230848, "acc_step": 0, "speed/wps": 5526.654750779873, "speed/FLOPS": 244249852001088.1, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0429435633122921, "optim/lr": 2.8920526195370446e-05, "optim/total_tokens": 1936493379584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2892835140228271, "created_at": "2025-06-03T04:14:38.080323+00:00"} {"global_step": 230849, "acc_step": 0, "speed/wps": 5514.868205047758, "speed/FLOPS": 243728947008738.62, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0433795303106308, "optim/lr": 2.891697897027612e-05, "optim/total_tokens": 1936501768192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3009756803512573, "created_at": "2025-06-03T04:14:41.058881+00:00"} {"global_step": 230850, "acc_step": 0, "speed/wps": 5506.316544049398, "speed/FLOPS": 243351007363980.06, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041705138981342316, "optim/lr": 2.8913431745181574e-05, "optim/total_tokens": 1936510156800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3108017444610596, "created_at": "2025-06-03T04:14:44.039283+00:00"} {"global_step": 230851, "acc_step": 0, "speed/wps": 5520.651427931976, "speed/FLOPS": 243984535859002.94, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043929703533649445, "optim/lr": 2.8909884520087027e-05, "optim/total_tokens": 1936518545408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.297237515449524, "created_at": "2025-06-03T04:14:47.011827+00:00"} {"global_step": 230852, "acc_step": 0, "speed/wps": 5529.665080324442, "speed/FLOPS": 244382893158694.62, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 189.95, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04304200038313866, "optim/lr": 2.890633729499248e-05, "optim/total_tokens": 1936526934016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.296560287475586, "created_at": "2025-06-03T04:14:49.979800+00:00"} {"global_step": 230853, "acc_step": 0, "speed/wps": 5525.379335088089, "speed/FLOPS": 244193485155680.53, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04142739996314049, "optim/lr": 2.8902790069898155e-05, "optim/total_tokens": 1936535322624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.305618166923523, "created_at": "2025-06-03T04:14:52.950777+00:00"} {"global_step": 230854, "acc_step": 0, "speed/wps": 5521.897540741354, "speed/FLOPS": 244039607666993.84, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04565365985035896, "optim/lr": 2.889924284480361e-05, "optim/total_tokens": 1936543711232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3068183660507202, "created_at": "2025-06-03T04:14:55.923808+00:00"} {"global_step": 230855, "acc_step": 0, "speed/wps": 5527.269115990842, "speed/FLOPS": 244277003798806.7, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04071090742945671, "optim/lr": 2.8895695619709062e-05, "optim/total_tokens": 1936552099840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.313839316368103, "created_at": "2025-06-03T04:14:58.895048+00:00"} {"global_step": 230856, "acc_step": 0, "speed/wps": 5518.111089439821, "speed/FLOPS": 243872265900280.78, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.040889766067266464, "optim/lr": 2.8892148394614516e-05, "optim/total_tokens": 1936560488448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3033795356750488, "created_at": "2025-06-03T04:15:01.870776+00:00"} {"global_step": 230857, "acc_step": 0, "speed/wps": 5525.4076607448915, "speed/FLOPS": 244194737004727.34, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04174702242016792, "optim/lr": 2.888860116952019e-05, "optim/total_tokens": 1936568877056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.300257682800293, "created_at": "2025-06-03T04:15:04.846148+00:00"} {"global_step": 230858, "acc_step": 0, "speed/wps": 5507.778581077926, "speed/FLOPS": 243415621917257.12, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04190471023321152, "optim/lr": 2.8885053944425643e-05, "optim/total_tokens": 1936577265664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.30158531665802, "created_at": "2025-06-03T04:15:07.825847+00:00"} {"global_step": 230859, "acc_step": 0, "speed/wps": 5505.167143926093, "speed/FLOPS": 243300209761693.12, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.73 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.73, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04173438251018524, "optim/lr": 2.8881506719331097e-05, "optim/total_tokens": 1936585654272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3036272525787354, "created_at": "2025-06-03T04:15:10.805825+00:00"} {"global_step": 230860, "acc_step": 0, "speed/wps": 5531.948840778477, "speed/FLOPS": 244483823681417.3, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04824952408671379, "optim/lr": 2.887795949423655e-05, "optim/total_tokens": 1936594042880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2998566627502441, "created_at": "2025-06-03T04:15:13.771769+00:00"} {"global_step": 230861, "acc_step": 0, "speed/wps": 5532.413828513654, "speed/FLOPS": 244504373759289.16, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043893493711948395, "optim/lr": 2.8874412269142224e-05, "optim/total_tokens": 1936602431488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2969716787338257, "created_at": "2025-06-03T04:15:16.736915+00:00"} {"global_step": 230862, "acc_step": 0, "speed/wps": 5523.154785496776, "speed/FLOPS": 244095171450021.5, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043566249310970306, "optim/lr": 2.8870865044047678e-05, "optim/total_tokens": 1936610820096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3035506010055542, "created_at": "2025-06-03T04:15:19.707993+00:00"} {"global_step": 230863, "acc_step": 0, "speed/wps": 5520.831105791922, "speed/FLOPS": 243992476700737.88, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04417232424020767, "optim/lr": 2.886731781895313e-05, "optim/total_tokens": 1936619208704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3009682893753052, "created_at": "2025-06-03T04:15:22.679915+00:00"} {"global_step": 230864, "acc_step": 0, "speed/wps": 5512.103564754559, "speed/FLOPS": 243606764058491.03, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04186196252703667, "optim/lr": 2.8863770593858585e-05, "optim/total_tokens": 1936627597312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2905091047286987, "created_at": "2025-06-03T04:15:25.657685+00:00"} {"global_step": 230865, "acc_step": 0, "speed/wps": 5528.679715822026, "speed/FLOPS": 244339345091240.6, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04545273259282112, "optim/lr": 2.886022336876426e-05, "optim/total_tokens": 1936635985920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2967509031295776, "created_at": "2025-06-03T04:15:28.624799+00:00"} {"global_step": 230866, "acc_step": 0, "speed/wps": 5514.810240391491, "speed/FLOPS": 243726385267621.62, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043791208416223526, "optim/lr": 2.8856676143669712e-05, "optim/total_tokens": 1936644374528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3205534219741821, "created_at": "2025-06-03T04:15:31.599925+00:00"} {"global_step": 230867, "acc_step": 0, "speed/wps": 5508.642352729319, "speed/FLOPS": 243453796203064.6, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.72 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.72, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04121725633740425, "optim/lr": 2.8853128918575166e-05, "optim/total_tokens": 1936652763136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2937089204788208, "created_at": "2025-06-03T04:15:34.578661+00:00"} {"global_step": 230868, "acc_step": 0, "speed/wps": 5527.511744021675, "speed/FLOPS": 244287726715886.7, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04253657907247543, "optim/lr": 2.8849581693480843e-05, "optim/total_tokens": 1936661151744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2991172075271606, "created_at": "2025-06-03T04:15:37.550516+00:00"} {"global_step": 230869, "acc_step": 0, "speed/wps": 5528.158078438846, "speed/FLOPS": 244316291388886.2, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041263654828071594, "optim/lr": 2.8846034468386297e-05, "optim/total_tokens": 1936669540352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2819116115570068, "created_at": "2025-06-03T04:15:40.518042+00:00"} {"global_step": 230870, "acc_step": 0, "speed/wps": 5518.568761101146, "speed/FLOPS": 243892492645135.44, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04247570410370827, "optim/lr": 2.8842487243291747e-05, "optim/total_tokens": 1936677928960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.298224687576294, "created_at": "2025-06-03T04:15:43.491300+00:00"} {"global_step": 230871, "acc_step": 0, "speed/wps": 5529.999779329974, "speed/FLOPS": 244397685141594.38, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043537382036447525, "optim/lr": 2.88389400181972e-05, "optim/total_tokens": 1936686317568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2829841375350952, "created_at": "2025-06-03T04:15:46.460070+00:00"} {"global_step": 230872, "acc_step": 0, "speed/wps": 5523.5867000078915, "speed/FLOPS": 244114259860673.94, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04147861897945404, "optim/lr": 2.8835392793102878e-05, "optim/total_tokens": 1936694706176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.310571312904358, "created_at": "2025-06-03T04:15:49.430351+00:00"} {"global_step": 230873, "acc_step": 0, "speed/wps": 5529.906132687882, "speed/FLOPS": 244393546439340.84, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04187101125717163, "optim/lr": 2.883184556800833e-05, "optim/total_tokens": 1936703094784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.3046809434890747, "created_at": "2025-06-03T04:15:52.397091+00:00"} {"global_step": 230874, "acc_step": 0, "speed/wps": 5516.068655674336, "speed/FLOPS": 243782000781970.03, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0022, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.044753558933734894, "optim/lr": 2.8828298342913785e-05, "optim/total_tokens": 1936711483392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2873773574829102, "created_at": "2025-06-03T04:15:55.370803+00:00"} {"global_step": 230875, "acc_step": 0, "speed/wps": 5523.762664841717, "speed/FLOPS": 244122036605659.38, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041685234755277634, "optim/lr": 2.8824751117819235e-05, "optim/total_tokens": 1936719872000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.305875301361084, "created_at": "2025-06-03T04:15:58.340331+00:00"} {"global_step": 230876, "acc_step": 0, "speed/wps": 5513.244323424343, "speed/FLOPS": 243657179752763.3, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042492128908634186, "optim/lr": 2.8821203892724912e-05, "optim/total_tokens": 1936728260608, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3109270334243774, "created_at": "2025-06-03T04:16:01.315673+00:00"} {"global_step": 230877, "acc_step": 0, "speed/wps": 5529.163300669954, "speed/FLOPS": 244360717066307.38, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04299573227763176, "optim/lr": 2.8817656667630366e-05, "optim/total_tokens": 1936736649216, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.308779239654541, "created_at": "2025-06-03T04:16:04.283420+00:00"} {"global_step": 230878, "acc_step": 0, "speed/wps": 5527.828649051597, "speed/FLOPS": 244301732296142.22, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 189.92, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04398562014102936, "optim/lr": 2.881410944253582e-05, "optim/total_tokens": 1936745037824, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3074589967727661, "created_at": "2025-06-03T04:16:07.251133+00:00"} {"global_step": 230879, "acc_step": 0, "speed/wps": 5507.9376347807765, "speed/FLOPS": 243422651276812.44, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.71 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.71, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04228716343641281, "optim/lr": 2.8810562217441273e-05, "optim/total_tokens": 1936753426432, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3205797672271729, "created_at": "2025-06-03T04:16:10.229303+00:00"} {"global_step": 230880, "acc_step": 0, "speed/wps": 5520.3391492988485, "speed/FLOPS": 243970734741805.62, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041208282113075256, "optim/lr": 2.8807014992346947e-05, "optim/total_tokens": 1936761815040, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3046156167984009, "created_at": "2025-06-03T04:16:13.205034+00:00"} {"global_step": 230881, "acc_step": 0, "speed/wps": 5532.046576419179, "speed/FLOPS": 244488143096479.97, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 189.8, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04335789009928703, "optim/lr": 2.88034677672524e-05, "optim/total_tokens": 1936770203648, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2879830598831177, "created_at": "2025-06-03T04:16:16.173042+00:00"} {"global_step": 230882, "acc_step": 0, "speed/wps": 5517.459747660532, "speed/FLOPS": 243843479927505.7, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041877686977386475, "optim/lr": 2.8799920542157854e-05, "optim/total_tokens": 1936778592256, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3019012212753296, "created_at": "2025-06-03T04:16:19.147360+00:00"} {"global_step": 230883, "acc_step": 0, "speed/wps": 5513.73699266272, "speed/FLOPS": 243678953211389.8, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.7 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.7, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04690292850136757, "optim/lr": 2.8796373317063308e-05, "optim/total_tokens": 1936786980864, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3003878593444824, "created_at": "2025-06-03T04:16:22.123032+00:00"} {"global_step": 230884, "acc_step": 0, "speed/wps": 5538.439499180326, "speed/FLOPS": 244770677560577.66, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 189.61, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.047093190252780914, "optim/lr": 2.8792826091968982e-05, "optim/total_tokens": 1936795369472, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3025845289230347, "created_at": "2025-06-03T04:16:25.084994+00:00"} {"global_step": 230885, "acc_step": 0, "speed/wps": 5528.35160888092, "speed/FLOPS": 244324844443847.28, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041629016399383545, "optim/lr": 2.8789278866874435e-05, "optim/total_tokens": 1936803758080, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3094338178634644, "created_at": "2025-06-03T04:16:28.052198+00:00"} {"global_step": 230886, "acc_step": 0, "speed/wps": 5527.913267562144, "speed/FLOPS": 244305472001191.62, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04282711073756218, "optim/lr": 2.878573164177989e-05, "optim/total_tokens": 1936812146688, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2966138124465942, "created_at": "2025-06-03T04:16:31.022501+00:00"} {"global_step": 230887, "acc_step": 0, "speed/wps": 5519.2781520357385, "speed/FLOPS": 243923844093452.47, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04303360357880592, "optim/lr": 2.8782184416685343e-05, "optim/total_tokens": 1936820535296, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2887107133865356, "created_at": "2025-06-03T04:16:33.995846+00:00"} {"global_step": 230888, "acc_step": 0, "speed/wps": 5527.428525431475, "speed/FLOPS": 244284048880151.2, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04903775826096535, "optim/lr": 2.8778637191591016e-05, "optim/total_tokens": 1936828923904, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2899612188339233, "created_at": "2025-06-03T04:16:36.964407+00:00"} {"global_step": 230889, "acc_step": 0, "speed/wps": 5514.822384278302, "speed/FLOPS": 243726921965260.62, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04179190471768379, "optim/lr": 2.877508996649647e-05, "optim/total_tokens": 1936837312512, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.319559931755066, "created_at": "2025-06-03T04:16:39.940949+00:00"} {"global_step": 230890, "acc_step": 0, "speed/wps": 5528.404985359691, "speed/FLOPS": 244327203411003.34, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05114678665995598, "optim/lr": 2.8771542741401924e-05, "optim/total_tokens": 1936845701120, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2909996509552002, "created_at": "2025-06-03T04:16:42.911641+00:00"} {"global_step": 230891, "acc_step": 0, "speed/wps": 5516.266510638289, "speed/FLOPS": 243790744958663.28, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.69 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.69, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04121541231870651, "optim/lr": 2.8767995516307377e-05, "optim/total_tokens": 1936854089728, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2959011793136597, "created_at": "2025-06-03T04:16:45.887918+00:00"} {"global_step": 230892, "acc_step": 0, "speed/wps": 5520.910068494177, "speed/FLOPS": 243995966448009.78, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.046283140778541565, "optim/lr": 2.876444829121305e-05, "optim/total_tokens": 1936862478336, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2996731996536255, "created_at": "2025-06-03T04:16:48.859101+00:00"} {"global_step": 230893, "acc_step": 0, "speed/wps": 5527.795585818196, "speed/FLOPS": 244300271070458.88, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04137048125267029, "optim/lr": 2.8760901066118505e-05, "optim/total_tokens": 1936870866944, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.302936315536499, "created_at": "2025-06-03T04:16:51.826540+00:00"} {"global_step": 230894, "acc_step": 0, "speed/wps": 5532.099333633937, "speed/FLOPS": 244490474695336.38, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04595155268907547, "optim/lr": 2.8757353841023958e-05, "optim/total_tokens": 1936879255552, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3012504577636719, "created_at": "2025-06-03T04:16:54.791653+00:00"} {"global_step": 230895, "acc_step": 0, "speed/wps": 5520.9093802137995, "speed/FLOPS": 243995936029540.06, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04230721667408943, "optim/lr": 2.8753806615929635e-05, "optim/total_tokens": 1936887644160, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3016366958618164, "created_at": "2025-06-03T04:16:57.762704+00:00"} {"global_step": 230896, "acc_step": 0, "speed/wps": 5531.6356580504125, "speed/FLOPS": 244469982607851.38, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04402340576052666, "optim/lr": 2.8750259390835086e-05, "optim/total_tokens": 1936896032768, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2845451831817627, "created_at": "2025-06-03T04:17:00.729383+00:00"} {"global_step": 230897, "acc_step": 0, "speed/wps": 5522.767565202847, "speed/FLOPS": 244078058295003.0, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04676172137260437, "optim/lr": 2.874671216574054e-05, "optim/total_tokens": 1936904421376, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3017382621765137, "created_at": "2025-06-03T04:17:03.699988+00:00"} {"global_step": 230898, "acc_step": 0, "speed/wps": 5535.321997067307, "speed/FLOPS": 244632899924004.6, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04188593477010727, "optim/lr": 2.8743164940645993e-05, "optim/total_tokens": 1936912809984, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.3101892471313477, "created_at": "2025-06-03T04:17:06.667054+00:00"} {"global_step": 230899, "acc_step": 0, "speed/wps": 5522.37592061376, "speed/FLOPS": 244060749608784.06, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.23, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05372385308146477, "optim/lr": 2.873961771555167e-05, "optim/total_tokens": 1936921198592, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2890276908874512, "created_at": "2025-06-03T04:17:09.639670+00:00"} {"global_step": 230900, "acc_step": 0, "speed/wps": 5513.674316423714, "speed/FLOPS": 243676183242431.8, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043431635946035385, "optim/lr": 2.8736070490457124e-05, "optim/total_tokens": 1936929587200, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3021193742752075, "created_at": "2025-06-03T04:17:12.618112+00:00"} {"global_step": 230901, "acc_step": 0, "speed/wps": 5523.524265721964, "speed/FLOPS": 244111500584803.6, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0427708700299263, "optim/lr": 2.8732523265362577e-05, "optim/total_tokens": 1936937975808, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.306402325630188, "created_at": "2025-06-03T04:17:15.592568+00:00"} {"global_step": 230902, "acc_step": 0, "speed/wps": 5525.717898799437, "speed/FLOPS": 244208447938795.94, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041004009544849396, "optim/lr": 2.8728976040268028e-05, "optim/total_tokens": 1936946364416, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2778958082199097, "created_at": "2025-06-03T04:17:18.564671+00:00"} {"global_step": 230903, "acc_step": 0, "speed/wps": 5528.528144132356, "speed/FLOPS": 244332646398371.4, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04874378442764282, "optim/lr": 2.8725428815173705e-05, "optim/total_tokens": 1936954753024, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3097426891326904, "created_at": "2025-06-03T04:17:21.535298+00:00"} {"global_step": 230904, "acc_step": 0, "speed/wps": 5521.332159193289, "speed/FLOPS": 244014620696454.5, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04611616209149361, "optim/lr": 2.872188159007916e-05, "optim/total_tokens": 1936963141632, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3088606595993042, "created_at": "2025-06-03T04:17:24.509107+00:00"} {"global_step": 230905, "acc_step": 0, "speed/wps": 5524.808213882301, "speed/FLOPS": 244168244521648.03, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.040990252047777176, "optim/lr": 2.8718334364984612e-05, "optim/total_tokens": 1936971530240, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3067573308944702, "created_at": "2025-06-03T04:17:27.477903+00:00"} {"global_step": 230906, "acc_step": 0, "speed/wps": 5525.50166922884, "speed/FLOPS": 244198891698538.84, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041443850845098495, "optim/lr": 2.8714787139890066e-05, "optim/total_tokens": 1936979918848, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.290404200553894, "created_at": "2025-06-03T04:17:30.447074+00:00"} {"global_step": 230907, "acc_step": 0, "speed/wps": 5527.686036748674, "speed/FLOPS": 244295429562309.0, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04171411320567131, "optim/lr": 2.871123991479574e-05, "optim/total_tokens": 1936988307456, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2960065603256226, "created_at": "2025-06-03T04:17:33.418850+00:00"} {"global_step": 230908, "acc_step": 0, "speed/wps": 5525.6785579464395, "speed/FLOPS": 244206709274458.22, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04288208857178688, "optim/lr": 2.8707692689701193e-05, "optim/total_tokens": 1936996696064, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2949281930923462, "created_at": "2025-06-03T04:17:36.387204+00:00"} {"global_step": 230909, "acc_step": 0, "speed/wps": 5515.716847439542, "speed/FLOPS": 243766452658709.94, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04490651562809944, "optim/lr": 2.8704145464606647e-05, "optim/total_tokens": 1937005084672, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.274984359741211, "created_at": "2025-06-03T04:17:39.362914+00:00"} {"global_step": 230910, "acc_step": 0, "speed/wps": 5519.190285695408, "speed/FLOPS": 243919960850950.56, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04142340272665024, "optim/lr": 2.87005982395121e-05, "optim/total_tokens": 1937013473280, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.309973120689392, "created_at": "2025-06-03T04:17:42.335038+00:00"} {"global_step": 230911, "acc_step": 0, "speed/wps": 5523.9373616833245, "speed/FLOPS": 244129757311878.9, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04179471731185913, "optim/lr": 2.8697051014417774e-05, "optim/total_tokens": 1937021861888, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2886003255844116, "created_at": "2025-06-03T04:17:45.304700+00:00"} {"global_step": 230912, "acc_step": 0, "speed/wps": 5528.425815039735, "speed/FLOPS": 244328123976245.34, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041403695940971375, "optim/lr": 2.8693503789323228e-05, "optim/total_tokens": 1937030250496, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3159379959106445, "created_at": "2025-06-03T04:17:48.274841+00:00"} {"global_step": 230913, "acc_step": 0, "speed/wps": 5520.287752052629, "speed/FLOPS": 243968463246597.7, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043624669313430786, "optim/lr": 2.868995656422868e-05, "optim/total_tokens": 1937038639104, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2833998203277588, "created_at": "2025-06-03T04:17:51.247746+00:00"} {"global_step": 230914, "acc_step": 0, "speed/wps": 5522.332433979667, "speed/FLOPS": 244058827722141.94, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043846506625413895, "optim/lr": 2.8686409339134135e-05, "optim/total_tokens": 1937047027712, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.3159288167953491, "created_at": "2025-06-03T04:17:54.218912+00:00"} {"global_step": 230915, "acc_step": 0, "speed/wps": 5521.547232436328, "speed/FLOPS": 244024125832952.2, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04445311427116394, "optim/lr": 2.868286211403981e-05, "optim/total_tokens": 1937055416320, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3025550842285156, "created_at": "2025-06-03T04:17:57.191096+00:00"} {"global_step": 230916, "acc_step": 0, "speed/wps": 5514.315883782422, "speed/FLOPS": 243704537235847.28, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04163968190550804, "optim/lr": 2.8679314888945262e-05, "optim/total_tokens": 1937063804928, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.299583911895752, "created_at": "2025-06-03T04:18:00.166062+00:00"} {"global_step": 230917, "acc_step": 0, "speed/wps": 5508.854919562523, "speed/FLOPS": 243463190569076.5, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.68 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.68, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041920047253370285, "optim/lr": 2.8675767663850716e-05, "optim/total_tokens": 1937072193536, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.308537483215332, "created_at": "2025-06-03T04:18:03.144972+00:00"} {"global_step": 230918, "acc_step": 0, "speed/wps": 5518.37248235961, "speed/FLOPS": 243883818129405.22, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04388010874390602, "optim/lr": 2.867222043875617e-05, "optim/total_tokens": 1937080582144, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2903269529342651, "created_at": "2025-06-03T04:18:06.122112+00:00"} {"global_step": 230919, "acc_step": 0, "speed/wps": 5532.386356129126, "speed/FLOPS": 244503159620509.44, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041653916239738464, "optim/lr": 2.8668673213661843e-05, "optim/total_tokens": 1937088970752, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.301954746246338, "created_at": "2025-06-03T04:18:09.089398+00:00"} {"global_step": 230920, "acc_step": 0, "speed/wps": 5527.569302982683, "speed/FLOPS": 244290270527349.78, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04380276799201965, "optim/lr": 2.8665125988567297e-05, "optim/total_tokens": 1937097359360, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3133841753005981, "created_at": "2025-06-03T04:18:12.057055+00:00"} {"global_step": 230921, "acc_step": 0, "speed/wps": 5536.073772747578, "speed/FLOPS": 244666124561135.78, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 189.72, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04427938908338547, "optim/lr": 2.866157876347275e-05, "optim/total_tokens": 1937105747968, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3125097751617432, "created_at": "2025-06-03T04:18:15.021279+00:00"} {"global_step": 230922, "acc_step": 0, "speed/wps": 5527.518434893524, "speed/FLOPS": 244288022418175.4, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041532568633556366, "optim/lr": 2.8658031538378428e-05, "optim/total_tokens": 1937114136576, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.31419038772583, "created_at": "2025-06-03T04:18:17.989265+00:00"} {"global_step": 230923, "acc_step": 0, "speed/wps": 5513.702685069293, "speed/FLOPS": 243677436991362.5, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04348558560013771, "optim/lr": 2.8654484313283878e-05, "optim/total_tokens": 1937122525184, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.299770474433899, "created_at": "2025-06-03T04:18:20.964373+00:00"} {"global_step": 230924, "acc_step": 0, "speed/wps": 5506.493388900223, "speed/FLOPS": 243358823001212.53, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.67 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.67, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04096106067299843, "optim/lr": 2.865093708818933e-05, "optim/total_tokens": 1937130913792, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3098254203796387, "created_at": "2025-06-03T04:18:23.943509+00:00"} {"global_step": 230925, "acc_step": 0, "speed/wps": 5517.7228306868, "speed/FLOPS": 243855106850685.72, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.044682275503873825, "optim/lr": 2.8647389863094785e-05, "optim/total_tokens": 1937139302400, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2902607917785645, "created_at": "2025-06-03T04:18:26.916699+00:00"} {"global_step": 230926, "acc_step": 0, "speed/wps": 5513.920406482315, "speed/FLOPS": 243687059163418.88, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04140162467956543, "optim/lr": 2.8643842638000462e-05, "optim/total_tokens": 1937147691008, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3029043674468994, "created_at": "2025-06-03T04:18:29.891629+00:00"} {"global_step": 230927, "acc_step": 0, "speed/wps": 5529.215532822184, "speed/FLOPS": 244363025460087.56, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.047642823308706284, "optim/lr": 2.8640295412905916e-05, "optim/total_tokens": 1937156079616, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3085285425186157, "created_at": "2025-06-03T04:18:32.858396+00:00"} {"global_step": 230928, "acc_step": 0, "speed/wps": 5532.196594868958, "speed/FLOPS": 244494773144096.16, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 189.86, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04674005135893822, "optim/lr": 2.8636748187811366e-05, "optim/total_tokens": 1937164468224, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3052587509155273, "created_at": "2025-06-03T04:18:35.823465+00:00"} {"global_step": 230929, "acc_step": 0, "speed/wps": 5524.794886047795, "speed/FLOPS": 244167655499580.94, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04096014052629471, "optim/lr": 2.863320096271682e-05, "optim/total_tokens": 1937172856832, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2984411716461182, "created_at": "2025-06-03T04:18:38.796362+00:00"} {"global_step": 230930, "acc_step": 0, "speed/wps": 5523.645586396113, "speed/FLOPS": 244116862337625.47, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04412573203444481, "optim/lr": 2.8629653737622497e-05, "optim/total_tokens": 1937181245440, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3194153308868408, "created_at": "2025-06-03T04:18:41.768831+00:00"} {"global_step": 230931, "acc_step": 0, "speed/wps": 5524.14419324931, "speed/FLOPS": 244138898208435.53, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041439153254032135, "optim/lr": 2.862610651252795e-05, "optim/total_tokens": 1937189634048, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2992922067642212, "created_at": "2025-06-03T04:18:44.743093+00:00"} {"global_step": 230932, "acc_step": 0, "speed/wps": 5519.647323741716, "speed/FLOPS": 243940159593264.56, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041408903896808624, "optim/lr": 2.8622559287433404e-05, "optim/total_tokens": 1937198022656, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2959833145141602, "created_at": "2025-06-03T04:18:47.717856+00:00"} {"global_step": 230933, "acc_step": 0, "speed/wps": 5522.97724121685, "speed/FLOPS": 244087324901602.8, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0451224222779274, "optim/lr": 2.8619012062338855e-05, "optim/total_tokens": 1937206411264, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3010390996932983, "created_at": "2025-06-03T04:18:50.689283+00:00"} {"global_step": 230934, "acc_step": 0, "speed/wps": 5520.761664228453, "speed/FLOPS": 243989407739066.7, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05045616626739502, "optim/lr": 2.8615464837244532e-05, "optim/total_tokens": 1937214799872, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3182523250579834, "created_at": "2025-06-03T04:18:53.661407+00:00"} {"global_step": 230935, "acc_step": 0, "speed/wps": 5520.151625256098, "speed/FLOPS": 243962447138951.1, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04702692851424217, "optim/lr": 2.8611917612149985e-05, "optim/total_tokens": 1937223188480, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3090931177139282, "created_at": "2025-06-03T04:18:56.638170+00:00"} {"global_step": 230936, "acc_step": 0, "speed/wps": 5519.06742356724, "speed/FLOPS": 243914530973750.94, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04519197717308998, "optim/lr": 2.860837038705544e-05, "optim/total_tokens": 1937231577088, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2891631126403809, "created_at": "2025-06-03T04:18:59.611871+00:00"} {"global_step": 230937, "acc_step": 0, "speed/wps": 5519.338452675135, "speed/FLOPS": 243926509073067.16, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04435737058520317, "optim/lr": 2.8604823161960893e-05, "optim/total_tokens": 1937239965696, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.30999755859375, "created_at": "2025-06-03T04:19:02.586023+00:00"} {"global_step": 230938, "acc_step": 0, "speed/wps": 5534.845034271262, "speed/FLOPS": 244611820609736.28, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04356905445456505, "optim/lr": 2.8601275936866566e-05, "optim/total_tokens": 1937248354304, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.286311388015747, "created_at": "2025-06-03T04:19:05.550265+00:00"} {"global_step": 230939, "acc_step": 0, "speed/wps": 5510.857862420141, "speed/FLOPS": 243551710391392.3, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.66 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.66, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0440954826772213, "optim/lr": 2.859772871177202e-05, "optim/total_tokens": 1937256742912, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3106982707977295, "created_at": "2025-06-03T04:19:08.528327+00:00"} {"global_step": 230940, "acc_step": 0, "speed/wps": 5531.170960231627, "speed/FLOPS": 244449445342800.12, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.045454829931259155, "optim/lr": 2.8594181486677474e-05, "optim/total_tokens": 1937265131520, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2894352674484253, "created_at": "2025-06-03T04:19:11.497513+00:00"} {"global_step": 230941, "acc_step": 0, "speed/wps": 5519.182675615685, "speed/FLOPS": 243919624524378.72, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.045430365949869156, "optim/lr": 2.8590634261582927e-05, "optim/total_tokens": 1937273520128, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2908127307891846, "created_at": "2025-06-03T04:19:14.473749+00:00"} {"global_step": 230942, "acc_step": 0, "speed/wps": 5510.498393178826, "speed/FLOPS": 243535823690856.56, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0417657233774662, "optim/lr": 2.85870870364886e-05, "optim/total_tokens": 1937281908736, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.296898603439331, "created_at": "2025-06-03T04:19:17.450760+00:00"} {"global_step": 230943, "acc_step": 0, "speed/wps": 5509.959942081807, "speed/FLOPS": 243512026908410.88, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04308586195111275, "optim/lr": 2.8583539811394055e-05, "optim/total_tokens": 1937290297344, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2932283878326416, "created_at": "2025-06-03T04:19:20.431300+00:00"} {"global_step": 230944, "acc_step": 0, "speed/wps": 5529.148410831552, "speed/FLOPS": 244360059011663.1, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04771290719509125, "optim/lr": 2.8579992586299508e-05, "optim/total_tokens": 1937298685952, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2993009090423584, "created_at": "2025-06-03T04:19:23.398329+00:00"} {"global_step": 230945, "acc_step": 0, "speed/wps": 5523.171013823466, "speed/FLOPS": 244095888658997.1, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04334317892789841, "optim/lr": 2.8576445361204962e-05, "optim/total_tokens": 1937307074560, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.295438528060913, "created_at": "2025-06-03T04:19:26.368822+00:00"} {"global_step": 230946, "acc_step": 0, "speed/wps": 5522.003532556422, "speed/FLOPS": 244044291962704.6, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.040599122643470764, "optim/lr": 2.8572898136110636e-05, "optim/total_tokens": 1937315463168, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3035635948181152, "created_at": "2025-06-03T04:19:29.339724+00:00"} {"global_step": 230947, "acc_step": 0, "speed/wps": 5529.156027130493, "speed/FLOPS": 244360395613092.56, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.045441433787345886, "optim/lr": 2.856935091101609e-05, "optim/total_tokens": 1937323851776, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2867475748062134, "created_at": "2025-06-03T04:19:32.308425+00:00"} {"global_step": 230948, "acc_step": 0, "speed/wps": 5514.169821882886, "speed/FLOPS": 243698082047500.38, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05158618465065956, "optim/lr": 2.8565803685921543e-05, "optim/total_tokens": 1937332240384, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2922245264053345, "created_at": "2025-06-03T04:19:35.283348+00:00"} {"global_step": 230949, "acc_step": 0, "speed/wps": 5518.448259255714, "speed/FLOPS": 243887167080351.72, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04260149970650673, "optim/lr": 2.8562256460826997e-05, "optim/total_tokens": 1937340628992, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2974551916122437, "created_at": "2025-06-03T04:19:38.259288+00:00"} {"global_step": 230950, "acc_step": 0, "speed/wps": 5515.6862423518205, "speed/FLOPS": 243765100070483.7, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04622196778655052, "optim/lr": 2.855870923573267e-05, "optim/total_tokens": 1937349017600, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2989139556884766, "created_at": "2025-06-03T04:19:41.233262+00:00"} {"global_step": 230951, "acc_step": 0, "speed/wps": 5510.689335333845, "speed/FLOPS": 243544262356777.84, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.65 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.65, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042327411472797394, "optim/lr": 2.8555162010638124e-05, "optim/total_tokens": 1937357406208, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3047382831573486, "created_at": "2025-06-03T04:19:44.213975+00:00"} {"global_step": 230952, "acc_step": 0, "speed/wps": 5516.886073839279, "speed/FLOPS": 243818126480935.06, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.046164028346538544, "optim/lr": 2.8551614785543578e-05, "optim/total_tokens": 1937365794816, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2947741746902466, "created_at": "2025-06-03T04:19:47.188624+00:00"} {"global_step": 230953, "acc_step": 0, "speed/wps": 5528.17740490251, "speed/FLOPS": 244317145519658.3, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041941314935684204, "optim/lr": 2.8548067560449255e-05, "optim/total_tokens": 1937374183424, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.281595230102539, "created_at": "2025-06-03T04:19:50.157215+00:00"} {"global_step": 230954, "acc_step": 0, "speed/wps": 5521.51321663712, "speed/FLOPS": 244022622508735.84, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04245720058679581, "optim/lr": 2.854452033535471e-05, "optim/total_tokens": 1937382572032, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3184633255004883, "created_at": "2025-06-03T04:19:53.128268+00:00"} {"global_step": 230955, "acc_step": 0, "speed/wps": 5528.449177929056, "speed/FLOPS": 244329156496371.2, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.02, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04331168532371521, "optim/lr": 2.854097311026016e-05, "optim/total_tokens": 1937390960640, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2989473342895508, "created_at": "2025-06-03T04:19:56.095163+00:00"} {"global_step": 230956, "acc_step": 0, "speed/wps": 5520.732474457307, "speed/FLOPS": 243988117700588.84, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04364321380853653, "optim/lr": 2.8537425885165612e-05, "optim/total_tokens": 1937399349248, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2805432081222534, "created_at": "2025-06-03T04:19:59.069012+00:00"} {"global_step": 230957, "acc_step": 0, "speed/wps": 5522.801798880115, "speed/FLOPS": 244079571248314.38, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04868677258491516, "optim/lr": 2.853387866007129e-05, "optim/total_tokens": 1937407737856, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2891581058502197, "created_at": "2025-06-03T04:20:02.040576+00:00"} {"global_step": 230958, "acc_step": 0, "speed/wps": 5520.3904465964515, "speed/FLOPS": 243973001819796.3, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04134465008974075, "optim/lr": 2.8530331434976743e-05, "optim/total_tokens": 1937416126464, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2917567491531372, "created_at": "2025-06-03T04:20:05.015613+00:00"} {"global_step": 230959, "acc_step": 0, "speed/wps": 5508.78451235642, "speed/FLOPS": 243460078930943.53, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.64 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.64, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042948052287101746, "optim/lr": 2.8526784209882197e-05, "optim/total_tokens": 1937424515072, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3042293787002563, "created_at": "2025-06-03T04:20:07.993004+00:00"} {"global_step": 230960, "acc_step": 0, "speed/wps": 5515.228649679861, "speed/FLOPS": 243744876816554.7, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041794728487730026, "optim/lr": 2.8523236984787647e-05, "optim/total_tokens": 1937432903680, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2983152866363525, "created_at": "2025-06-03T04:20:10.967277+00:00"} {"global_step": 230961, "acc_step": 0, "speed/wps": 5524.118059669436, "speed/FLOPS": 244137743237968.9, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04251587390899658, "optim/lr": 2.8519689759693324e-05, "optim/total_tokens": 1937441292288, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3027284145355225, "created_at": "2025-06-03T04:20:13.940084+00:00"} {"global_step": 230962, "acc_step": 0, "speed/wps": 5534.982713475952, "speed/FLOPS": 244617905325877.5, "speed/curr_iter_time": 2.958, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.958, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041302744299173355, "optim/lr": 2.8516142534598778e-05, "optim/total_tokens": 1937449680896, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3284237384796143, "created_at": "2025-06-03T04:20:16.906770+00:00"} {"global_step": 230963, "acc_step": 0, "speed/wps": 5518.207790626726, "speed/FLOPS": 243876539597780.44, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043187595903873444, "optim/lr": 2.851259530950423e-05, "optim/total_tokens": 1937458069504, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2999998331069946, "created_at": "2025-06-03T04:20:19.883114+00:00"} {"global_step": 230964, "acc_step": 0, "speed/wps": 5523.469250961502, "speed/FLOPS": 244109069213982.25, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.048023521900177, "optim/lr": 2.8509048084409685e-05, "optim/total_tokens": 1937466458112, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3049027919769287, "created_at": "2025-06-03T04:20:22.856188+00:00"} {"global_step": 230965, "acc_step": 0, "speed/wps": 5517.167675623651, "speed/FLOPS": 243830571838435.75, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.043812043964862823, "optim/lr": 2.850550085931536e-05, "optim/total_tokens": 1937474846720, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2975279092788696, "created_at": "2025-06-03T04:20:25.834188+00:00"} {"global_step": 230966, "acc_step": 0, "speed/wps": 5520.829639610609, "speed/FLOPS": 243992411903028.44, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042796142399311066, "optim/lr": 2.8501953634220812e-05, "optim/total_tokens": 1937483235328, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3121113777160645, "created_at": "2025-06-03T04:20:28.805911+00:00"} {"global_step": 230967, "acc_step": 0, "speed/wps": 5511.015778067339, "speed/FLOPS": 243558689454712.9, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.63 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.63, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04435789957642555, "optim/lr": 2.8498406409126266e-05, "optim/total_tokens": 1937491623936, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3032817840576172, "created_at": "2025-06-03T04:20:31.783441+00:00"} {"global_step": 230968, "acc_step": 0, "speed/wps": 5520.399111941419, "speed/FLOPS": 243973384783690.6, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04121532291173935, "optim/lr": 2.849485918403172e-05, "optim/total_tokens": 1937500012544, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3051027059555054, "created_at": "2025-06-03T04:20:34.755924+00:00"} {"global_step": 230969, "acc_step": 0, "speed/wps": 5524.558572957298, "speed/FLOPS": 244157211670540.97, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04153955355286598, "optim/lr": 2.8491311958937393e-05, "optim/total_tokens": 1937508401152, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3006932735443115, "created_at": "2025-06-03T04:20:37.729542+00:00"} {"global_step": 230970, "acc_step": 0, "speed/wps": 5526.7896679496525, "speed/FLOPS": 244255814649423.66, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04182806238532066, "optim/lr": 2.8487764733842847e-05, "optim/total_tokens": 1937516789760, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3252167701721191, "created_at": "2025-06-03T04:20:40.697823+00:00"} {"global_step": 230971, "acc_step": 0, "speed/wps": 5521.448466336737, "speed/FLOPS": 244019760876880.97, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04224977642297745, "optim/lr": 2.84842175087483e-05, "optim/total_tokens": 1937525178368, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.287074327468872, "created_at": "2025-06-03T04:20:43.672483+00:00"} {"global_step": 230972, "acc_step": 0, "speed/wps": 5533.040640193175, "speed/FLOPS": 244532075627210.97, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 189.87, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04118410870432854, "optim/lr": 2.8480670283653754e-05, "optim/total_tokens": 1937533566976, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2999505996704102, "created_at": "2025-06-03T04:20:46.638019+00:00"} {"global_step": 230973, "acc_step": 0, "speed/wps": 5519.6807935385705, "speed/FLOPS": 243941638786971.6, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0421355776488781, "optim/lr": 2.8477123058559428e-05, "optim/total_tokens": 1937541955584, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2929050922393799, "created_at": "2025-06-03T04:20:49.610480+00:00"} {"global_step": 230974, "acc_step": 0, "speed/wps": 5518.606479949594, "speed/FLOPS": 243894159625174.28, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041172925382852554, "optim/lr": 2.847357583346488e-05, "optim/total_tokens": 1937550344192, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2909797430038452, "created_at": "2025-06-03T04:20:52.582649+00:00"} {"global_step": 230975, "acc_step": 0, "speed/wps": 5514.551323564916, "speed/FLOPS": 243714942469143.47, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0423845537006855, "optim/lr": 2.8470028608370335e-05, "optim/total_tokens": 1937558732800, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3034117221832275, "created_at": "2025-06-03T04:20:55.560465+00:00"} {"global_step": 230976, "acc_step": 0, "speed/wps": 5531.964706374586, "speed/FLOPS": 244484524859557.84, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 189.97, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04274765029549599, "optim/lr": 2.846648138327579e-05, "optim/total_tokens": 1937567121408, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2975326776504517, "created_at": "2025-06-03T04:20:58.527439+00:00"} {"global_step": 230977, "acc_step": 0, "speed/wps": 5519.634230777635, "speed/FLOPS": 243939580951268.06, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04679353907704353, "optim/lr": 2.8462934158181463e-05, "optim/total_tokens": 1937575510016, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3049508333206177, "created_at": "2025-06-03T04:21:01.499623+00:00"} {"global_step": 230978, "acc_step": 0, "speed/wps": 5514.2224538661185, "speed/FLOPS": 243700408111764.34, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.62 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.62, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04266805574297905, "optim/lr": 2.8459386933086916e-05, "optim/total_tokens": 1937583898624, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2964191436767578, "created_at": "2025-06-03T04:21:04.477807+00:00"} {"global_step": 230979, "acc_step": 0, "speed/wps": 5522.183268539756, "speed/FLOPS": 244052235373195.78, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04196006432175636, "optim/lr": 2.845583970799237e-05, "optim/total_tokens": 1937592287232, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3078070878982544, "created_at": "2025-06-03T04:21:07.448317+00:00"} {"global_step": 230980, "acc_step": 0, "speed/wps": 5518.627548336251, "speed/FLOPS": 243895090740026.72, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04166233167052269, "optim/lr": 2.8452292482898047e-05, "optim/total_tokens": 1937600675840, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.297612190246582, "created_at": "2025-06-03T04:21:10.421588+00:00"} {"global_step": 230981, "acc_step": 0, "speed/wps": 5533.874136887925, "speed/FLOPS": 244568911914896.06, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.59 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.59, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04112694039940834, "optim/lr": 2.8448745257803497e-05, "optim/total_tokens": 1937609064448, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.3119500875473022, "created_at": "2025-06-03T04:21:13.391833+00:00"} {"global_step": 230982, "acc_step": 0, "speed/wps": 5521.110397431117, "speed/FLOPS": 244004819961646.1, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.23, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042766641825437546, "optim/lr": 2.844519803270895e-05, "optim/total_tokens": 1937617453056, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.321357250213623, "created_at": "2025-06-03T04:21:16.367679+00:00"} {"global_step": 230983, "acc_step": 0, "speed/wps": 5518.351419382443, "speed/FLOPS": 243882887253624.53, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.44, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041817158460617065, "optim/lr": 2.8441650807614405e-05, "optim/total_tokens": 1937625841664, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.29916512966156, "created_at": "2025-06-03T04:21:19.340468+00:00"} {"global_step": 230984, "acc_step": 0, "speed/wps": 5514.317439411686, "speed/FLOPS": 243704605986698.3, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.041511647403240204, "optim/lr": 2.8438103582520082e-05, "optim/total_tokens": 1937634230272, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2910581827163696, "created_at": "2025-06-03T04:21:22.317439+00:00"} {"global_step": 230985, "acc_step": 0, "speed/wps": 5511.237198388038, "speed/FLOPS": 243568475099555.88, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.042629219591617584, "optim/lr": 2.8434556357425535e-05, "optim/total_tokens": 1937642618880, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3033881187438965, "created_at": "2025-06-03T04:21:25.294322+00:00"} {"global_step": 230986, "acc_step": 0, "speed/wps": 5546.682379473948, "speed/FLOPS": 245134970678669.72, "speed/curr_iter_time": 2.953, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.953, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 189.47, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04161900281906128, "optim/lr": 2.8431009132330986e-05, "optim/total_tokens": 1937651007488, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.308379888534546, "created_at": "2025-06-03T04:21:28.255229+00:00"} {"global_step": 230987, "acc_step": 0, "speed/wps": 5519.4774218045795, "speed/FLOPS": 243932650797280.1, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.0559610053896904, "optim/lr": 2.842746190723644e-05, "optim/total_tokens": 1937659396096, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.301782250404358, "created_at": "2025-06-03T04:21:31.227418+00:00"} {"global_step": 230988, "acc_step": 0, "speed/wps": 5520.14368168787, "speed/FLOPS": 243962096073894.3, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.049554355442523956, "optim/lr": 2.8423914682142116e-05, "optim/total_tokens": 1937667784704, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3021749258041382, "created_at": "2025-06-03T04:21:34.202660+00:00"} {"global_step": 230989, "acc_step": 0, "speed/wps": 5518.92483574665, "speed/FLOPS": 243908229321911.47, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04220138490200043, "optim/lr": 2.842036745704757e-05, "optim/total_tokens": 1937676173312, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2781956195831299, "created_at": "2025-06-03T04:21:37.177624+00:00"} {"global_step": 230990, "acc_step": 0, "speed/wps": 5518.189719910447, "speed/FLOPS": 243875740964615.22, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.45, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.05048394575715065, "optim/lr": 2.8416820231953024e-05, "optim/total_tokens": 1937684561920, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2939262390136719, "created_at": "2025-06-03T04:21:40.155654+00:00"} {"global_step": 230991, "acc_step": 0, "speed/wps": 5522.401825352922, "speed/FLOPS": 244061894465662.56, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04248989000916481, "optim/lr": 2.8413273006858474e-05, "optim/total_tokens": 1937692950528, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.312630295753479, "created_at": "2025-06-03T04:21:43.126294+00:00"} {"global_step": 230992, "acc_step": 0, "speed/wps": 5524.360279288859, "speed/FLOPS": 244148448105354.97, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.59 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.59, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05651233717799187, "optim/lr": 2.840972578176415e-05, "optim/total_tokens": 1937701339136, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3071972131729126, "created_at": "2025-06-03T04:21:46.096261+00:00"} {"global_step": 230993, "acc_step": 0, "speed/wps": 5518.433484196699, "speed/FLOPS": 243886514098368.84, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.45, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.046012863516807556, "optim/lr": 2.8406178556669605e-05, "optim/total_tokens": 1937709727744, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2915089130401611, "created_at": "2025-06-03T04:21:49.068702+00:00"} {"global_step": 230994, "acc_step": 0, "speed/wps": 5522.242475164672, "speed/FLOPS": 244054852002970.12, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04616517201066017, "optim/lr": 2.8402631331575058e-05, "optim/total_tokens": 1937718116352, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3048863410949707, "created_at": "2025-06-03T04:21:52.042748+00:00"} {"global_step": 230995, "acc_step": 0, "speed/wps": 5526.638369154663, "speed/FLOPS": 244249128017102.6, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.59 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.59, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04390852153301239, "optim/lr": 2.8399084106480512e-05, "optim/total_tokens": 1937726504960, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3029415607452393, "created_at": "2025-06-03T04:21:55.011691+00:00"} {"global_step": 230996, "acc_step": 0, "speed/wps": 5524.060953304406, "speed/FLOPS": 244135219428931.47, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.59 hours", "speed/est_time_elapsed_hrs": 190.19, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.59, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0524478480219841, "optim/lr": 2.8395536881386186e-05, "optim/total_tokens": 1937734893568, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3036073446273804, "created_at": "2025-06-03T04:21:57.981462+00:00"} {"global_step": 230997, "acc_step": 0, "speed/wps": 5524.389298392214, "speed/FLOPS": 244149730601190.06, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.59 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.59, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05302472785115242, "optim/lr": 2.839198965629164e-05, "optim/total_tokens": 1937743282176, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.297556757926941, "created_at": "2025-06-03T04:22:00.951239+00:00"} {"global_step": 230998, "acc_step": 0, "speed/wps": 5512.524730949725, "speed/FLOPS": 243625377448593.38, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.045946016907691956, "optim/lr": 2.8388442431197093e-05, "optim/total_tokens": 1937751670784, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3067840337753296, "created_at": "2025-06-03T04:22:03.929006+00:00"} {"global_step": 230999, "acc_step": 0, "speed/wps": 5507.3959447518855, "speed/FLOPS": 243398711350156.38, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.61 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.61, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.056945402175188065, "optim/lr": 2.8384895206102547e-05, "optim/total_tokens": 1937760059392, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2886110544204712, "created_at": "2025-06-03T04:22:06.909754+00:00"} {"global_step": 231000, "acc_step": 0, "speed/wps": 5511.674224667452, "speed/FLOPS": 243587789424202.7, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.6 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.6, "speed/est_time_remaining_days": 0.28, "optim/grad_norm": 0.04104152321815491, "optim/lr": 2.838134798100822e-05, "optim/total_tokens": 1937768448000, "memory/max_active_gib": 82.15578985214233, "memory/max_active_pct": 64.1842108219862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3062807321548462, "created_at": "2025-06-03T04:22:09.886046+00:00"} {"global_step": 231001, "acc_step": 0, "speed/wps": 222.24579148073494, "speed/FLOPS": 9822126426365.639, "speed/curr_iter_time": 6.2905, "speed/data_load_time": 2.8693, "speed/curr_step_time": 6.2905, "speed/est_time_elapsed": "16.82 days", "speed/est_time_remaining": "13.98 hours", "speed/est_time_elapsed_hrs": 403.64, "speed/est_time_elapsed_days": 16.82, "speed/est_time_remaining_hrs": 13.98, "speed/est_time_remaining_days": 0.58, "optim/grad_norm": 0.048700619488954544, "optim/lr": 2.8377800755913674e-05, "optim/total_tokens": 1937776836608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3129266500473022, "created_at": "2025-06-03T04:23:23.613481+00:00"} {"global_step": 231002, "acc_step": 0, "speed/wps": 5611.875682859928, "speed/FLOPS": 248016180998753.62, "speed/curr_iter_time": 2.9164, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9164, "speed/est_time_elapsed": "7.8 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 187.14, "speed/est_time_elapsed_days": 7.8, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04216621071100235, "optim/lr": 2.8374253530819128e-05, "optim/total_tokens": 1937785225216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3015711307525635, "created_at": "2025-06-03T04:23:26.538553+00:00"} {"global_step": 231003, "acc_step": 0, "speed/wps": 5558.19221589499, "speed/FLOPS": 245643646535796.44, "speed/curr_iter_time": 2.9465, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9465, "speed/est_time_elapsed": "7.88 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 189.07, "speed/est_time_elapsed_days": 7.88, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04301171004772186, "optim/lr": 2.837070630572458e-05, "optim/total_tokens": 1937793613824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2916160821914673, "created_at": "2025-06-03T04:23:29.492830+00:00"} {"global_step": 231004, "acc_step": 0, "speed/wps": 5582.778504749919, "speed/FLOPS": 246730234659149.9, "speed/curr_iter_time": 2.9337, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9337, "speed/est_time_elapsed": "7.84 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 188.25, "speed/est_time_elapsed_days": 7.84, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04316103085875511, "optim/lr": 2.8367159080630255e-05, "optim/total_tokens": 1937802002432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2967756986618042, "created_at": "2025-06-03T04:23:32.433142+00:00"} {"global_step": 231005, "acc_step": 0, "speed/wps": 5570.525769630203, "speed/FLOPS": 246188726482042.06, "speed/curr_iter_time": 2.9391, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9391, "speed/est_time_elapsed": "7.86 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 188.6, "speed/est_time_elapsed_days": 7.86, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04448253661394119, "optim/lr": 2.836361185553571e-05, "optim/total_tokens": 1937810391040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.295555591583252, "created_at": "2025-06-03T04:23:35.383774+00:00"} {"global_step": 231006, "acc_step": 0, "speed/wps": 5536.104314434017, "speed/FLOPS": 244667474347349.9, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 189.84, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04202442988753319, "optim/lr": 2.8360064630441162e-05, "optim/total_tokens": 1937818779648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3027938604354858, "created_at": "2025-06-03T04:23:38.352418+00:00"} {"global_step": 231007, "acc_step": 0, "speed/wps": 5542.28617090358, "speed/FLOPS": 244940680761694.75, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.63, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04306884855031967, "optim/lr": 2.8356517405346836e-05, "optim/total_tokens": 1937827168256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3011035919189453, "created_at": "2025-06-03T04:23:41.312767+00:00"} {"global_step": 231008, "acc_step": 0, "speed/wps": 5541.089867714626, "speed/FLOPS": 244887810283977.8, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.68, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.040602054446935654, "optim/lr": 2.835297018025229e-05, "optim/total_tokens": 1937835556864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2966786623001099, "created_at": "2025-06-03T04:23:44.276571+00:00"} {"global_step": 231009, "acc_step": 0, "speed/wps": 5528.929289282709, "speed/FLOPS": 244350374960770.0, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043039221316576004, "optim/lr": 2.8349422955157743e-05, "optim/total_tokens": 1937843945472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2963531017303467, "created_at": "2025-06-03T04:23:47.243475+00:00"} {"global_step": 231010, "acc_step": 0, "speed/wps": 5530.68685027695, "speed/FLOPS": 244428050160702.78, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04454119876027107, "optim/lr": 2.8345875730063197e-05, "optim/total_tokens": 1937852334080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2804481983184814, "created_at": "2025-06-03T04:23:50.214103+00:00"} {"global_step": 231011, "acc_step": 0, "speed/wps": 5528.8829808681985, "speed/FLOPS": 244348328365876.6, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.1, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04685361310839653, "optim/lr": 2.8342328504968874e-05, "optim/total_tokens": 1937860722688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3102593421936035, "created_at": "2025-06-03T04:23:53.181141+00:00"} {"global_step": 231012, "acc_step": 0, "speed/wps": 5541.293713829865, "speed/FLOPS": 244896819238892.38, "speed/curr_iter_time": 2.9548, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9548, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.61, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04199262708425522, "optim/lr": 2.8338781279874328e-05, "optim/total_tokens": 1937869111296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3135689496994019, "created_at": "2025-06-03T04:23:56.145825+00:00"} {"global_step": 231013, "acc_step": 0, "speed/wps": 5536.024845079408, "speed/FLOPS": 244663962208637.2, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04518797993659973, "optim/lr": 2.8335234054779778e-05, "optim/total_tokens": 1937877499904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3057032823562622, "created_at": "2025-06-03T04:23:59.110055+00:00"} {"global_step": 231014, "acc_step": 0, "speed/wps": 5535.060342617861, "speed/FLOPS": 244621336136607.97, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04623826593160629, "optim/lr": 2.833168682968523e-05, "optim/total_tokens": 1937885888512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2954535484313965, "created_at": "2025-06-03T04:24:02.073806+00:00"} {"global_step": 231015, "acc_step": 0, "speed/wps": 5522.455145510537, "speed/FLOPS": 244064250943711.8, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.58 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.58, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05584334209561348, "optim/lr": 2.832813960459091e-05, "optim/total_tokens": 1937894277120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2985355854034424, "created_at": "2025-06-03T04:24:05.048095+00:00"} {"global_step": 231016, "acc_step": 0, "speed/wps": 5533.698977648759, "speed/FLOPS": 244561170773071.22, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.88, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044778287410736084, "optim/lr": 2.8324592379496362e-05, "optim/total_tokens": 1937902665728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3238861560821533, "created_at": "2025-06-03T04:24:08.012737+00:00"} {"global_step": 231017, "acc_step": 0, "speed/wps": 5545.829241971106, "speed/FLOPS": 245097266367797.72, "speed/curr_iter_time": 2.9535, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9535, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.056831784546375275, "optim/lr": 2.8321045154401816e-05, "optim/total_tokens": 1937911054336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2987743616104126, "created_at": "2025-06-03T04:24:10.974953+00:00"} {"global_step": 231018, "acc_step": 0, "speed/wps": 5530.25469699297, "speed/FLOPS": 244408951197511.88, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0429287888109684, "optim/lr": 2.8317497929307266e-05, "optim/total_tokens": 1937919442944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3051583766937256, "created_at": "2025-06-03T04:24:13.943724+00:00"} {"global_step": 231019, "acc_step": 0, "speed/wps": 5525.912685647541, "speed/FLOPS": 244217056520472.7, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05207115784287453, "optim/lr": 2.8313950704212943e-05, "optim/total_tokens": 1937927831552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2982900142669678, "created_at": "2025-06-03T04:24:16.912316+00:00"} {"global_step": 231020, "acc_step": 0, "speed/wps": 5505.432471631457, "speed/FLOPS": 243311935888199.9, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.59 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.59, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04673953726887703, "optim/lr": 2.8310403479118397e-05, "optim/total_tokens": 1937936220160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2786506414413452, "created_at": "2025-06-03T04:24:19.892232+00:00"} {"global_step": 231021, "acc_step": 0, "speed/wps": 5536.512946651121, "speed/FLOPS": 244685533799776.56, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.85, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05483845993876457, "optim/lr": 2.830685625402385e-05, "optim/total_tokens": 1937944608768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.297478437423706, "created_at": "2025-06-03T04:24:22.855249+00:00"} {"global_step": 231022, "acc_step": 0, "speed/wps": 5540.825220146684, "speed/FLOPS": 244876114216063.8, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 189.64, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04412476718425751, "optim/lr": 2.8303309028929304e-05, "optim/total_tokens": 1937952997376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.298600435256958, "created_at": "2025-06-03T04:24:25.821405+00:00"} {"global_step": 231023, "acc_step": 0, "speed/wps": 5527.338135671419, "speed/FLOPS": 244280054115413.47, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05450573191046715, "optim/lr": 2.8299761803834978e-05, "optim/total_tokens": 1937961385984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2947330474853516, "created_at": "2025-06-03T04:24:28.793690+00:00"} {"global_step": 231024, "acc_step": 0, "speed/wps": 5530.2071303331195, "speed/FLOPS": 244406848994614.72, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.07, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04257499426603317, "optim/lr": 2.8296214578740432e-05, "optim/total_tokens": 1937969774592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.290185809135437, "created_at": "2025-06-03T04:24:31.763031+00:00"} {"global_step": 231025, "acc_step": 0, "speed/wps": 5535.235784854704, "speed/FLOPS": 244629089785481.66, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04699118807911873, "optim/lr": 2.8292667353645885e-05, "optim/total_tokens": 1937978163200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2903863191604614, "created_at": "2025-06-03T04:24:34.727368+00:00"} {"global_step": 231026, "acc_step": 0, "speed/wps": 5528.892983499982, "speed/FLOPS": 244348770431003.28, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.05, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.045188724994659424, "optim/lr": 2.828912012855134e-05, "optim/total_tokens": 1937986551808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2978298664093018, "created_at": "2025-06-03T04:24:37.696952+00:00"} {"global_step": 231027, "acc_step": 0, "speed/wps": 5525.904653022667, "speed/FLOPS": 244216701519567.94, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04144107922911644, "optim/lr": 2.8285572903457013e-05, "optim/total_tokens": 1937994940416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3117300271987915, "created_at": "2025-06-03T04:24:40.666150+00:00"} {"global_step": 231028, "acc_step": 0, "speed/wps": 5523.313173880231, "speed/FLOPS": 244102171405865.0, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04681464657187462, "optim/lr": 2.8282025678362466e-05, "optim/total_tokens": 1938003329024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3016557693481445, "created_at": "2025-06-03T04:24:43.638449+00:00"} {"global_step": 231029, "acc_step": 0, "speed/wps": 5532.204167811513, "speed/FLOPS": 244495107829395.28, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 189.94, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0410732701420784, "optim/lr": 2.827847845326792e-05, "optim/total_tokens": 1938011717632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2794809341430664, "created_at": "2025-06-03T04:24:46.607110+00:00"} {"global_step": 231030, "acc_step": 0, "speed/wps": 5546.0943843929035, "speed/FLOPS": 245108984305719.22, "speed/curr_iter_time": 2.9533, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9533, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04550684243440628, "optim/lr": 2.8274931228173374e-05, "optim/total_tokens": 1938020106240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2933913469314575, "created_at": "2025-06-03T04:24:49.567432+00:00"} {"global_step": 231031, "acc_step": 0, "speed/wps": 5527.672112743596, "speed/FLOPS": 244294814192554.06, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04075944796204567, "optim/lr": 2.8271384003079047e-05, "optim/total_tokens": 1938028494848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3009672164916992, "created_at": "2025-06-03T04:24:52.534928+00:00"} {"global_step": 231032, "acc_step": 0, "speed/wps": 5537.436701364628, "speed/FLOPS": 244726359029908.34, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0468614436686039, "optim/lr": 2.82678367779845e-05, "optim/total_tokens": 1938036883456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2881795167922974, "created_at": "2025-06-03T04:24:55.497213+00:00"} {"global_step": 231033, "acc_step": 0, "speed/wps": 5529.0683555931255, "speed/FLOPS": 244356520979884.5, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.11, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041101254522800446, "optim/lr": 2.8264289552889955e-05, "optim/total_tokens": 1938045272064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2986037731170654, "created_at": "2025-06-03T04:24:58.463947+00:00"} {"global_step": 231034, "acc_step": 0, "speed/wps": 5514.943016976925, "speed/FLOPS": 243732253313085.62, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04616222158074379, "optim/lr": 2.826074232779563e-05, "optim/total_tokens": 1938053660672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2970242500305176, "created_at": "2025-06-03T04:25:01.442117+00:00"} {"global_step": 231035, "acc_step": 0, "speed/wps": 5520.838550626508, "speed/FLOPS": 243992805724320.44, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041840653866529465, "optim/lr": 2.8257195102701082e-05, "optim/total_tokens": 1938062049280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3018288612365723, "created_at": "2025-06-03T04:25:04.417916+00:00"} {"global_step": 231036, "acc_step": 0, "speed/wps": 5512.805141368517, "speed/FLOPS": 243637770153833.34, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04839467629790306, "optim/lr": 2.8253647877606536e-05, "optim/total_tokens": 1938070437888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3008084297180176, "created_at": "2025-06-03T04:25:07.394736+00:00"} {"global_step": 231037, "acc_step": 0, "speed/wps": 5525.24814224979, "speed/FLOPS": 244187687103733.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04263799265027046, "optim/lr": 2.825010065251199e-05, "optim/total_tokens": 1938078826496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2873761653900146, "created_at": "2025-06-03T04:25:10.363720+00:00"} {"global_step": 231038, "acc_step": 0, "speed/wps": 5524.67556172128, "speed/FLOPS": 244162381975106.25, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04973887652158737, "optim/lr": 2.8246553427417666e-05, "optim/total_tokens": 1938087215104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3027172088623047, "created_at": "2025-06-03T04:25:13.336426+00:00"} {"global_step": 231039, "acc_step": 0, "speed/wps": 5529.408767562476, "speed/FLOPS": 244371565446543.38, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044768039137125015, "optim/lr": 2.8243006202323117e-05, "optim/total_tokens": 1938095603712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2940218448638916, "created_at": "2025-06-03T04:25:16.303048+00:00"} {"global_step": 231040, "acc_step": 0, "speed/wps": 5520.976777061532, "speed/FLOPS": 243998914625241.47, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043658796697854996, "optim/lr": 2.823945897722857e-05, "optim/total_tokens": 1938103992320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.302668571472168, "created_at": "2025-06-03T04:25:19.274137+00:00"} {"global_step": 231041, "acc_step": 0, "speed/wps": 5532.681088362654, "speed/FLOPS": 244516185276655.03, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04303309693932533, "optim/lr": 2.8235911752134024e-05, "optim/total_tokens": 1938112380928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2919609546661377, "created_at": "2025-06-03T04:25:22.242650+00:00"} {"global_step": 231042, "acc_step": 0, "speed/wps": 5512.438038586519, "speed/FLOPS": 243621546089871.4, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04298417270183563, "optim/lr": 2.82323645270397e-05, "optim/total_tokens": 1938120769536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3017631769180298, "created_at": "2025-06-03T04:25:25.218566+00:00"} {"global_step": 231043, "acc_step": 0, "speed/wps": 5519.254353182674, "speed/FLOPS": 243922792305960.6, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041963815689086914, "optim/lr": 2.8228817301945155e-05, "optim/total_tokens": 1938129158144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3009380102157593, "created_at": "2025-06-03T04:25:28.190586+00:00"} {"global_step": 231044, "acc_step": 0, "speed/wps": 5528.680691858869, "speed/FLOPS": 244339388227073.25, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042199745774269104, "optim/lr": 2.8225270076850605e-05, "optim/total_tokens": 1938137546752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3014215230941772, "created_at": "2025-06-03T04:25:31.163223+00:00"} {"global_step": 231045, "acc_step": 0, "speed/wps": 5501.06187047907, "speed/FLOPS": 243118777688029.1, "speed/curr_iter_time": 2.9775, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9775, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.58 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.58, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041724126785993576, "optim/lr": 2.822172285175606e-05, "optim/total_tokens": 1938145935360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.279431939125061, "created_at": "2025-06-03T04:25:34.146313+00:00"} {"global_step": 231046, "acc_step": 0, "speed/wps": 5520.74952968696, "speed/FLOPS": 243988871454442.9, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04224938526749611, "optim/lr": 2.8218175626661736e-05, "optim/total_tokens": 1938154323968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3053572177886963, "created_at": "2025-06-03T04:25:37.117615+00:00"} {"global_step": 231047, "acc_step": 0, "speed/wps": 5521.760467101444, "speed/FLOPS": 244033549713716.34, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042301733046770096, "optim/lr": 2.821462840156719e-05, "optim/total_tokens": 1938162712576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2894774675369263, "created_at": "2025-06-03T04:25:40.091328+00:00"} {"global_step": 231048, "acc_step": 0, "speed/wps": 5522.983515379432, "speed/FLOPS": 244087602187474.84, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04284586012363434, "optim/lr": 2.8211081176472643e-05, "optim/total_tokens": 1938171101184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2929847240447998, "created_at": "2025-06-03T04:25:43.061345+00:00"} {"global_step": 231049, "acc_step": 0, "speed/wps": 5515.635672717326, "speed/FLOPS": 243762865151477.9, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04172053560614586, "optim/lr": 2.8207533951378093e-05, "optim/total_tokens": 1938179489792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3074586391448975, "created_at": "2025-06-03T04:25:46.040983+00:00"} {"global_step": 231050, "acc_step": 0, "speed/wps": 5507.049499109798, "speed/FLOPS": 243383400226045.66, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.57 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.57, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04439956322312355, "optim/lr": 2.820398672628377e-05, "optim/total_tokens": 1938187878400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3202457427978516, "created_at": "2025-06-03T04:25:49.019783+00:00"} {"global_step": 231051, "acc_step": 0, "speed/wps": 5514.652013001917, "speed/FLOPS": 243719392426883.66, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044702187180519104, "optim/lr": 2.8200439501189224e-05, "optim/total_tokens": 1938196267008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3066221475601196, "created_at": "2025-06-03T04:25:51.996370+00:00"} {"global_step": 231052, "acc_step": 0, "speed/wps": 5518.587086615899, "speed/FLOPS": 243893302539089.03, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042245637625455856, "optim/lr": 2.8196892276094678e-05, "optim/total_tokens": 1938204655616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2911494970321655, "created_at": "2025-06-03T04:25:54.969001+00:00"} {"global_step": 231053, "acc_step": 0, "speed/wps": 5512.668233736186, "speed/FLOPS": 243631719537241.12, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04530429095029831, "optim/lr": 2.819334505100013e-05, "optim/total_tokens": 1938213044224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.296426773071289, "created_at": "2025-06-03T04:25:57.947881+00:00"} {"global_step": 231054, "acc_step": 0, "speed/wps": 5513.9129746774925, "speed/FLOPS": 243686730715685.16, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.56 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.56, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042856790125370026, "optim/lr": 2.8189797825905805e-05, "optim/total_tokens": 1938221432832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3104782104492188, "created_at": "2025-06-03T04:26:00.922933+00:00"} {"global_step": 231055, "acc_step": 0, "speed/wps": 5529.404966231268, "speed/FLOPS": 244371397447160.97, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.047436535358428955, "optim/lr": 2.818625060081126e-05, "optim/total_tokens": 1938229821440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2859934568405151, "created_at": "2025-06-03T04:26:03.894176+00:00"} {"global_step": 231056, "acc_step": 0, "speed/wps": 5527.053160918008, "speed/FLOPS": 244267459689945.72, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041908904910087585, "optim/lr": 2.8182703375716712e-05, "optim/total_tokens": 1938238210048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.299614667892456, "created_at": "2025-06-03T04:26:06.862804+00:00"} {"global_step": 231057, "acc_step": 0, "speed/wps": 5524.022794298301, "speed/FLOPS": 244133532996177.12, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04495657607913017, "optim/lr": 2.8179156150622166e-05, "optim/total_tokens": 1938246598656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.301016926765442, "created_at": "2025-06-03T04:26:09.834901+00:00"} {"global_step": 231058, "acc_step": 0, "speed/wps": 5520.369958484097, "speed/FLOPS": 243972096350097.9, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044271960854530334, "optim/lr": 2.817560892552784e-05, "optim/total_tokens": 1938254987264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2905354499816895, "created_at": "2025-06-03T04:26:12.806930+00:00"} {"global_step": 231059, "acc_step": 0, "speed/wps": 5510.54244233402, "speed/FLOPS": 243537770438052.12, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041563719511032104, "optim/lr": 2.8172061700433293e-05, "optim/total_tokens": 1938263375872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2960231304168701, "created_at": "2025-06-03T04:26:15.786831+00:00"} {"global_step": 231060, "acc_step": 0, "speed/wps": 5517.805331970959, "speed/FLOPS": 243858752985165.7, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0428413525223732, "optim/lr": 2.8168514475338747e-05, "optim/total_tokens": 1938271764480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.301609754562378, "created_at": "2025-06-03T04:26:18.760205+00:00"} {"global_step": 231061, "acc_step": 0, "speed/wps": 5521.079657952926, "speed/FLOPS": 244003461434048.97, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04080500453710556, "optim/lr": 2.816496725024442e-05, "optim/total_tokens": 1938280153088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2777023315429688, "created_at": "2025-06-03T04:26:21.731207+00:00"} {"global_step": 231062, "acc_step": 0, "speed/wps": 5516.844969414588, "speed/FLOPS": 243816309875755.28, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04232130944728851, "optim/lr": 2.8161420025149874e-05, "optim/total_tokens": 1938288541696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2945202589035034, "created_at": "2025-06-03T04:26:24.708095+00:00"} {"global_step": 231063, "acc_step": 0, "speed/wps": 5525.206162603485, "speed/FLOPS": 244185831818238.16, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042014773935079575, "optim/lr": 2.8157872800055328e-05, "optim/total_tokens": 1938296930304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3109591007232666, "created_at": "2025-06-03T04:26:27.681913+00:00"} {"global_step": 231064, "acc_step": 0, "speed/wps": 5523.01334840694, "speed/FLOPS": 244088920654591.4, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04232156276702881, "optim/lr": 2.815432557496078e-05, "optim/total_tokens": 1938305318912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.288311243057251, "created_at": "2025-06-03T04:26:30.654824+00:00"} {"global_step": 231065, "acc_step": 0, "speed/wps": 5520.873471188238, "speed/FLOPS": 243994349034409.28, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.42, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04229424148797989, "optim/lr": 2.815077834986646e-05, "optim/total_tokens": 1938313707520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2866500616073608, "created_at": "2025-06-03T04:26:33.626526+00:00"} {"global_step": 231066, "acc_step": 0, "speed/wps": 5520.828973873591, "speed/FLOPS": 243992382480859.8, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04617098718881607, "optim/lr": 2.814723112477191e-05, "optim/total_tokens": 1938322096128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3004285097122192, "created_at": "2025-06-03T04:26:36.601530+00:00"} {"global_step": 231067, "acc_step": 0, "speed/wps": 5516.770127933411, "speed/FLOPS": 243813002265360.66, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.046355243772268295, "optim/lr": 2.8143683899677363e-05, "optim/total_tokens": 1938330484736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2971434593200684, "created_at": "2025-06-03T04:26:39.576316+00:00"} {"global_step": 231068, "acc_step": 0, "speed/wps": 5528.101255917997, "speed/FLOPS": 244313780124308.7, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04285688325762749, "optim/lr": 2.8140136674582816e-05, "optim/total_tokens": 1938338873344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.291072130203247, "created_at": "2025-06-03T04:26:42.543770+00:00"} {"global_step": 231069, "acc_step": 0, "speed/wps": 5504.78776286562, "speed/FLOPS": 243283443060668.53, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041628699749708176, "optim/lr": 2.8136589449488493e-05, "optim/total_tokens": 1938347261952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3058191537857056, "created_at": "2025-06-03T04:26:45.523530+00:00"} {"global_step": 231070, "acc_step": 0, "speed/wps": 5509.817799868777, "speed/FLOPS": 243505744950144.75, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042480841279029846, "optim/lr": 2.8133042224393947e-05, "optim/total_tokens": 1938355650560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2958383560180664, "created_at": "2025-06-03T04:26:48.500352+00:00"} {"global_step": 231071, "acc_step": 0, "speed/wps": 5507.280834018704, "speed/FLOPS": 243393624044939.9, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.55 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.55, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04229343309998512, "optim/lr": 2.8129494999299397e-05, "optim/total_tokens": 1938364039168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2870198488235474, "created_at": "2025-06-03T04:26:51.479096+00:00"} {"global_step": 231072, "acc_step": 0, "speed/wps": 5528.422770799002, "speed/FLOPS": 244327989436386.78, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042119305580854416, "optim/lr": 2.812594777420485e-05, "optim/total_tokens": 1938372427776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2991816997528076, "created_at": "2025-06-03T04:26:54.446075+00:00"} {"global_step": 231073, "acc_step": 0, "speed/wps": 5522.89798140015, "speed/FLOPS": 244083822023393.16, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04251391068100929, "optim/lr": 2.8122400549110528e-05, "optim/total_tokens": 1938380816384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2954579591751099, "created_at": "2025-06-03T04:26:57.416074+00:00"} {"global_step": 231074, "acc_step": 0, "speed/wps": 5512.373355867852, "speed/FLOPS": 243618687444782.5, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04225144907832146, "optim/lr": 2.8118853324015982e-05, "optim/total_tokens": 1938389204992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2936309576034546, "created_at": "2025-06-03T04:27:00.391788+00:00"} {"global_step": 231075, "acc_step": 0, "speed/wps": 5528.260093605075, "speed/FLOPS": 244320799937072.56, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04340550675988197, "optim/lr": 2.8115306098921435e-05, "optim/total_tokens": 1938397593600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2903339862823486, "created_at": "2025-06-03T04:27:03.359247+00:00"} {"global_step": 231076, "acc_step": 0, "speed/wps": 5517.573284686041, "speed/FLOPS": 243848497682898.0, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042244795709848404, "optim/lr": 2.8111758873826886e-05, "optim/total_tokens": 1938405982208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3018141984939575, "created_at": "2025-06-03T04:27:06.332416+00:00"} {"global_step": 231077, "acc_step": 0, "speed/wps": 5514.108542677046, "speed/FLOPS": 243695373820257.66, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043441783636808395, "optim/lr": 2.8108211648732563e-05, "optim/total_tokens": 1938414370816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2953917980194092, "created_at": "2025-06-03T04:27:09.307017+00:00"} {"global_step": 231078, "acc_step": 0, "speed/wps": 5521.851550660811, "speed/FLOPS": 244037575140832.44, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04427577555179596, "optim/lr": 2.8104664423638016e-05, "optim/total_tokens": 1938422759424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2992637157440186, "created_at": "2025-06-03T04:27:12.280740+00:00"} {"global_step": 231079, "acc_step": 0, "speed/wps": 5526.513041064073, "speed/FLOPS": 244243589156985.8, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0478806234896183, "optim/lr": 2.810111719854347e-05, "optim/total_tokens": 1938431148032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2993944883346558, "created_at": "2025-06-03T04:27:15.248673+00:00"} {"global_step": 231080, "acc_step": 0, "speed/wps": 5506.089891842717, "speed/FLOPS": 243340990496555.94, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.54 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.54, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.045195307582616806, "optim/lr": 2.8097569973448924e-05, "optim/total_tokens": 1938439536640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.295063853263855, "created_at": "2025-06-03T04:27:18.228048+00:00"} {"global_step": 231081, "acc_step": 0, "speed/wps": 5523.08240532976, "speed/FLOPS": 244091972617114.7, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04663928598165512, "optim/lr": 2.8094022748354597e-05, "optim/total_tokens": 1938447925248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.303430438041687, "created_at": "2025-06-03T04:27:21.198803+00:00"} {"global_step": 231082, "acc_step": 0, "speed/wps": 5526.242986436501, "speed/FLOPS": 244231654124712.03, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.047856446355581284, "optim/lr": 2.809047552326005e-05, "optim/total_tokens": 1938456313856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3074266910552979, "created_at": "2025-06-03T04:27:24.167721+00:00"} {"global_step": 231083, "acc_step": 0, "speed/wps": 5521.848221611527, "speed/FLOPS": 244037428013893.72, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04230394959449768, "optim/lr": 2.8086928298165505e-05, "optim/total_tokens": 1938464702464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3071365356445312, "created_at": "2025-06-03T04:27:27.138276+00:00"} {"global_step": 231084, "acc_step": 0, "speed/wps": 5511.781456281377, "speed/FLOPS": 243592528512677.03, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04231585934758186, "optim/lr": 2.8083381073070958e-05, "optim/total_tokens": 1938473091072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3049933910369873, "created_at": "2025-06-03T04:27:30.114369+00:00"} {"global_step": 231085, "acc_step": 0, "speed/wps": 5511.237205725863, "speed/FLOPS": 243568475423850.16, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0415085107088089, "optim/lr": 2.8079833847976632e-05, "optim/total_tokens": 1938481479680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3096657991409302, "created_at": "2025-06-03T04:27:33.090699+00:00"} {"global_step": 231086, "acc_step": 0, "speed/wps": 5515.6876495990755, "speed/FLOPS": 243765162263609.4, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0420021153986454, "optim/lr": 2.8076286622882086e-05, "optim/total_tokens": 1938489868288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.294122576713562, "created_at": "2025-06-03T04:27:36.069354+00:00"} {"global_step": 231087, "acc_step": 0, "speed/wps": 5513.935084798555, "speed/FLOPS": 243687707869866.25, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041127558797597885, "optim/lr": 2.807273939778754e-05, "optim/total_tokens": 1938498256896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2926534414291382, "created_at": "2025-06-03T04:27:39.048058+00:00"} {"global_step": 231088, "acc_step": 0, "speed/wps": 5525.1265715700665, "speed/FLOPS": 244182314301944.9, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04270993918180466, "optim/lr": 2.8069192172693213e-05, "optim/total_tokens": 1938506645504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2943205833435059, "created_at": "2025-06-03T04:27:42.018028+00:00"} {"global_step": 231089, "acc_step": 0, "speed/wps": 5522.807620121191, "speed/FLOPS": 244079828517374.12, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04116489738225937, "optim/lr": 2.8065644947598667e-05, "optim/total_tokens": 1938515034112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.295130968093872, "created_at": "2025-06-03T04:27:44.990704+00:00"} {"global_step": 231090, "acc_step": 0, "speed/wps": 5515.871962394263, "speed/FLOPS": 243773307945758.3, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04368146136403084, "optim/lr": 2.806209772250412e-05, "optim/total_tokens": 1938523422720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3058760166168213, "created_at": "2025-06-03T04:27:47.965882+00:00"} {"global_step": 231091, "acc_step": 0, "speed/wps": 5508.722633903723, "speed/FLOPS": 243457344220056.94, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.048125963658094406, "optim/lr": 2.8058550497409574e-05, "optim/total_tokens": 1938531811328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3020223379135132, "created_at": "2025-06-03T04:27:50.947717+00:00"} {"global_step": 231092, "acc_step": 0, "speed/wps": 5514.489642194187, "speed/FLOPS": 243712216468271.1, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041190922260284424, "optim/lr": 2.8055003272315248e-05, "optim/total_tokens": 1938540199936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.305397629737854, "created_at": "2025-06-03T04:27:53.927351+00:00"} {"global_step": 231093, "acc_step": 0, "speed/wps": 5511.479626173264, "speed/FLOPS": 243579189166804.94, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.53 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.53, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.046085599809885025, "optim/lr": 2.80514560472207e-05, "optim/total_tokens": 1938548588544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3060394525527954, "created_at": "2025-06-03T04:27:56.905833+00:00"} {"global_step": 231094, "acc_step": 0, "speed/wps": 5514.977426451986, "speed/FLOPS": 243733774035759.66, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044729698449373245, "optim/lr": 2.8047908822126155e-05, "optim/total_tokens": 1938556977152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2962532043457031, "created_at": "2025-06-03T04:27:59.881591+00:00"} {"global_step": 231095, "acc_step": 0, "speed/wps": 5513.653566649725, "speed/FLOPS": 243675266208628.47, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.7, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0513777881860733, "optim/lr": 2.804436159703161e-05, "optim/total_tokens": 1938565365760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2953563928604126, "created_at": "2025-06-03T04:28:02.856776+00:00"} {"global_step": 231096, "acc_step": 0, "speed/wps": 5514.432827202358, "speed/FLOPS": 243709705536437.75, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05200896039605141, "optim/lr": 2.8040814371937286e-05, "optim/total_tokens": 1938573754368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2971527576446533, "created_at": "2025-06-03T04:28:05.834958+00:00"} {"global_step": 231097, "acc_step": 0, "speed/wps": 5519.8087111745035, "speed/FLOPS": 243947292091738.03, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04571476951241493, "optim/lr": 2.8037267146842736e-05, "optim/total_tokens": 1938582142976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.304211974143982, "created_at": "2025-06-03T04:28:08.810405+00:00"} {"global_step": 231098, "acc_step": 0, "speed/wps": 5541.0560151718255, "speed/FLOPS": 244886314174859.03, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 189.76, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.06095404550433159, "optim/lr": 2.803371992174819e-05, "optim/total_tokens": 1938590531584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2759712934494019, "created_at": "2025-06-03T04:28:11.771700+00:00"} {"global_step": 231099, "acc_step": 0, "speed/wps": 5524.985844235398, "speed/FLOPS": 244176094874060.38, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04084466025233269, "optim/lr": 2.8030172696653643e-05, "optim/total_tokens": 1938598920192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2936193943023682, "created_at": "2025-06-03T04:28:14.742158+00:00"} {"global_step": 231100, "acc_step": 0, "speed/wps": 5514.707677723782, "speed/FLOPS": 243721852522672.2, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05033797398209572, "optim/lr": 2.802662547155932e-05, "optim/total_tokens": 1938607308800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2949427366256714, "created_at": "2025-06-03T04:28:17.716603+00:00"} {"global_step": 231101, "acc_step": 0, "speed/wps": 5517.673751804992, "speed/FLOPS": 243852937815318.28, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043112900108098984, "optim/lr": 2.8023078246464774e-05, "optim/total_tokens": 1938615697408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2988951206207275, "created_at": "2025-06-03T04:28:20.689732+00:00"} {"global_step": 231102, "acc_step": 0, "speed/wps": 5515.029259097944, "speed/FLOPS": 243736064773407.5, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04120735079050064, "optim/lr": 2.8019531021370224e-05, "optim/total_tokens": 1938624086016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.308847188949585, "created_at": "2025-06-03T04:28:23.664588+00:00"} {"global_step": 231103, "acc_step": 0, "speed/wps": 5507.579762857191, "speed/FLOPS": 243406835169544.53, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042479440569877625, "optim/lr": 2.8015983796275678e-05, "optim/total_tokens": 1938632474624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3049408197402954, "created_at": "2025-06-03T04:28:26.643829+00:00"} {"global_step": 231104, "acc_step": 0, "speed/wps": 5511.93722554857, "speed/FLOPS": 243599412716987.53, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.52 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.52, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04106597602367401, "optim/lr": 2.8012436571181355e-05, "optim/total_tokens": 1938640863232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2945939302444458, "created_at": "2025-06-03T04:28:29.624807+00:00"} {"global_step": 231105, "acc_step": 0, "speed/wps": 5522.920921341006, "speed/FLOPS": 244084835851361.72, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04118633642792702, "optim/lr": 2.800888934608681e-05, "optim/total_tokens": 1938649251840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2811076641082764, "created_at": "2025-06-03T04:28:32.599743+00:00"} {"global_step": 231106, "acc_step": 0, "speed/wps": 5526.65250628183, "speed/FLOPS": 244249752805762.97, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04079186171293259, "optim/lr": 2.8005342120992262e-05, "optim/total_tokens": 1938657640448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3109081983566284, "created_at": "2025-06-03T04:28:35.571504+00:00"} {"global_step": 231107, "acc_step": 0, "speed/wps": 5517.048121246722, "speed/FLOPS": 243825288146910.25, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 190.59, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041516926139593124, "optim/lr": 2.8001794895897713e-05, "optim/total_tokens": 1938666029056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3038866519927979, "created_at": "2025-06-03T04:28:38.545098+00:00"} {"global_step": 231108, "acc_step": 0, "speed/wps": 5525.342242487888, "speed/FLOPS": 244191845852608.8, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.040938399732112885, "optim/lr": 2.799824767080339e-05, "optim/total_tokens": 1938674417664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2982314825057983, "created_at": "2025-06-03T04:28:41.519232+00:00"} {"global_step": 231109, "acc_step": 0, "speed/wps": 5520.207275044208, "speed/FLOPS": 243964906574744.12, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04109116271138191, "optim/lr": 2.7994700445708843e-05, "optim/total_tokens": 1938682806272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2831242084503174, "created_at": "2025-06-03T04:28:44.492213+00:00"} {"global_step": 231110, "acc_step": 0, "speed/wps": 5522.152613750396, "speed/FLOPS": 244050880588411.53, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04312116280198097, "optim/lr": 2.7991153220614297e-05, "optim/total_tokens": 1938691194880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.292230248451233, "created_at": "2025-06-03T04:28:47.462750+00:00"} {"global_step": 231111, "acc_step": 0, "speed/wps": 5521.742408205494, "speed/FLOPS": 244032751602949.16, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04271441325545311, "optim/lr": 2.798760599551975e-05, "optim/total_tokens": 1938699583488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2955561876296997, "created_at": "2025-06-03T04:28:50.433744+00:00"} {"global_step": 231112, "acc_step": 0, "speed/wps": 5518.143984996885, "speed/FLOPS": 243873719715528.28, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0459866039454937, "optim/lr": 2.7984058770425424e-05, "optim/total_tokens": 1938707972096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2927275896072388, "created_at": "2025-06-03T04:28:53.407076+00:00"} {"global_step": 231113, "acc_step": 0, "speed/wps": 5528.620804144733, "speed/FLOPS": 244336741496641.5, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041289716958999634, "optim/lr": 2.7980511545330878e-05, "optim/total_tokens": 1938716360704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2812749147415161, "created_at": "2025-06-03T04:28:56.375227+00:00"} {"global_step": 231114, "acc_step": 0, "speed/wps": 5533.434828467145, "speed/FLOPS": 244549496731281.97, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04456368461251259, "optim/lr": 2.797696432023633e-05, "optim/total_tokens": 1938724749312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2981442213058472, "created_at": "2025-06-03T04:28:59.344667+00:00"} {"global_step": 231115, "acc_step": 0, "speed/wps": 5528.514578130112, "speed/FLOPS": 244332046850509.3, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04431904852390289, "optim/lr": 2.7973417095142005e-05, "optim/total_tokens": 1938733137920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2907716035842896, "created_at": "2025-06-03T04:29:02.316336+00:00"} {"global_step": 231116, "acc_step": 0, "speed/wps": 5518.532148521414, "speed/FLOPS": 243890874556511.44, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.051786184310913086, "optim/lr": 2.796986987004746e-05, "optim/total_tokens": 1938741526528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3043228387832642, "created_at": "2025-06-03T04:29:05.289068+00:00"} {"global_step": 231117, "acc_step": 0, "speed/wps": 5526.440542904461, "speed/FLOPS": 244240385109410.2, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0411730632185936, "optim/lr": 2.7966322644952913e-05, "optim/total_tokens": 1938749915136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3051620721817017, "created_at": "2025-06-03T04:29:08.257369+00:00"} {"global_step": 231118, "acc_step": 0, "speed/wps": 5509.647242430807, "speed/FLOPS": 243498207184378.56, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04562785476446152, "optim/lr": 2.7962775419858366e-05, "optim/total_tokens": 1938758303744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.298721432685852, "created_at": "2025-06-03T04:29:11.235567+00:00"} {"global_step": 231119, "acc_step": 0, "speed/wps": 5505.3784011568605, "speed/FLOPS": 243309546249980.53, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04331974312663078, "optim/lr": 2.795922819476404e-05, "optim/total_tokens": 1938766692352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3017070293426514, "created_at": "2025-06-03T04:29:14.215060+00:00"} {"global_step": 231120, "acc_step": 0, "speed/wps": 5506.422695615085, "speed/FLOPS": 243355698719850.47, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04166148975491524, "optim/lr": 2.7955680969669494e-05, "optim/total_tokens": 1938775080960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3113633394241333, "created_at": "2025-06-03T04:29:17.194634+00:00"} {"global_step": 231121, "acc_step": 0, "speed/wps": 5510.115176515893, "speed/FLOPS": 243518887475835.62, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.51 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.51, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04848632588982582, "optim/lr": 2.7952133744574947e-05, "optim/total_tokens": 1938783469568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3073292970657349, "created_at": "2025-06-03T04:29:20.174848+00:00"} {"global_step": 231122, "acc_step": 0, "speed/wps": 5524.369223824328, "speed/FLOPS": 244148843408040.47, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04393935203552246, "optim/lr": 2.79485865194804e-05, "optim/total_tokens": 1938791858176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2864280939102173, "created_at": "2025-06-03T04:29:23.144193+00:00"} {"global_step": 231123, "acc_step": 0, "speed/wps": 5520.823427948287, "speed/FLOPS": 243992137379347.97, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.42, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042483992874622345, "optim/lr": 2.7945039294386078e-05, "optim/total_tokens": 1938800246784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3015395402908325, "created_at": "2025-06-03T04:29:26.120275+00:00"} {"global_step": 231124, "acc_step": 0, "speed/wps": 5520.875030086442, "speed/FLOPS": 243994417929730.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04158303514122963, "optim/lr": 2.794149206929153e-05, "optim/total_tokens": 1938808635392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2909036874771118, "created_at": "2025-06-03T04:29:29.092570+00:00"} {"global_step": 231125, "acc_step": 0, "speed/wps": 5511.281437624445, "speed/FLOPS": 243570430247368.12, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0427459292113781, "optim/lr": 2.7937944844196982e-05, "optim/total_tokens": 1938817024000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3049613237380981, "created_at": "2025-06-03T04:29:32.072607+00:00"} {"global_step": 231126, "acc_step": 0, "speed/wps": 5523.385870511777, "speed/FLOPS": 244105384224884.22, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04265449941158295, "optim/lr": 2.7934397619102436e-05, "optim/total_tokens": 1938825412608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3059592247009277, "created_at": "2025-06-03T04:29:35.044076+00:00"} {"global_step": 231127, "acc_step": 0, "speed/wps": 5516.459025132534, "speed/FLOPS": 243799253113930.4, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041565656661987305, "optim/lr": 2.7930850394008113e-05, "optim/total_tokens": 1938833801216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2991859912872314, "created_at": "2025-06-03T04:29:38.017635+00:00"} {"global_step": 231128, "acc_step": 0, "speed/wps": 5510.232069548866, "speed/FLOPS": 243524053549580.25, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.5 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.5, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0411987379193306, "optim/lr": 2.7927303168913566e-05, "optim/total_tokens": 1938842189824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3086950778961182, "created_at": "2025-06-03T04:29:40.994915+00:00"} {"global_step": 231129, "acc_step": 0, "speed/wps": 5513.994613726589, "speed/FLOPS": 243690338743788.66, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04473159834742546, "optim/lr": 2.7923755943819017e-05, "optim/total_tokens": 1938850578432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2942644357681274, "created_at": "2025-06-03T04:29:43.971630+00:00"} {"global_step": 231130, "acc_step": 0, "speed/wps": 5521.7812874708925, "speed/FLOPS": 244034469867477.66, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041466452181339264, "optim/lr": 2.792020871872447e-05, "optim/total_tokens": 1938858967040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3019617795944214, "created_at": "2025-06-03T04:29:46.942734+00:00"} {"global_step": 231131, "acc_step": 0, "speed/wps": 5515.239640400058, "speed/FLOPS": 243745362550131.8, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04380938783288002, "optim/lr": 2.7916661493630147e-05, "optim/total_tokens": 1938867355648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3039742708206177, "created_at": "2025-06-03T04:29:49.919593+00:00"} {"global_step": 231132, "acc_step": 0, "speed/wps": 5533.700695234879, "speed/FLOPS": 244561246681586.34, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.47 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.47, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04820435494184494, "optim/lr": 2.79131142685356e-05, "optim/total_tokens": 1938875744256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3146777153015137, "created_at": "2025-06-03T04:29:52.885445+00:00"} {"global_step": 231133, "acc_step": 0, "speed/wps": 5536.195926270869, "speed/FLOPS": 244671523121626.84, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 189.9, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04281610623002052, "optim/lr": 2.7909567043441055e-05, "optim/total_tokens": 1938884132864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2964454889297485, "created_at": "2025-06-03T04:29:55.849202+00:00"} {"global_step": 231134, "acc_step": 0, "speed/wps": 5515.9801075881605, "speed/FLOPS": 243778087409791.28, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04492631182074547, "optim/lr": 2.7906019818346505e-05, "optim/total_tokens": 1938892521472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2965013980865479, "created_at": "2025-06-03T04:29:58.823483+00:00"} {"global_step": 231135, "acc_step": 0, "speed/wps": 5518.51333779544, "speed/FLOPS": 243890043218705.4, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04064134135842323, "optim/lr": 2.7902472593252182e-05, "optim/total_tokens": 1938900910080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2910481691360474, "created_at": "2025-06-03T04:30:01.799043+00:00"} {"global_step": 231136, "acc_step": 0, "speed/wps": 5518.590033043533, "speed/FLOPS": 243893432756109.28, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042962852865457535, "optim/lr": 2.7898925368157636e-05, "optim/total_tokens": 1938909298688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3135261535644531, "created_at": "2025-06-03T04:30:04.775468+00:00"} {"global_step": 231137, "acc_step": 0, "speed/wps": 5511.620089367127, "speed/FLOPS": 243585396921017.9, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04276517406105995, "optim/lr": 2.789537814306309e-05, "optim/total_tokens": 1938917687296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.293592095375061, "created_at": "2025-06-03T04:30:07.756197+00:00"} {"global_step": 231138, "acc_step": 0, "speed/wps": 5512.127693168729, "speed/FLOPS": 243607830410896.94, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041216228157281876, "optim/lr": 2.7891830917968543e-05, "optim/total_tokens": 1938926075904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.302176594734192, "created_at": "2025-06-03T04:30:10.732097+00:00"} {"global_step": 231139, "acc_step": 0, "speed/wps": 5535.379959594148, "speed/FLOPS": 244635461571011.84, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04799744486808777, "optim/lr": 2.7888283692874217e-05, "optim/total_tokens": 1938934464512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.295814037322998, "created_at": "2025-06-03T04:30:13.699356+00:00"} {"global_step": 231140, "acc_step": 0, "speed/wps": 5540.831596441969, "speed/FLOPS": 244876396015678.56, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 189.73, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.040895819664001465, "optim/lr": 2.788473646777967e-05, "optim/total_tokens": 1938942853120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.295112133026123, "created_at": "2025-06-03T04:30:16.663575+00:00"} {"global_step": 231141, "acc_step": 0, "speed/wps": 5516.365721502172, "speed/FLOPS": 243795129571039.66, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04684389755129814, "optim/lr": 2.7881189242685124e-05, "optim/total_tokens": 1938951241728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3045014142990112, "created_at": "2025-06-03T04:30:19.638851+00:00"} {"global_step": 231142, "acc_step": 0, "speed/wps": 5519.982968345466, "speed/FLOPS": 243954993366765.53, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041279636323451996, "optim/lr": 2.7877642017590798e-05, "optim/total_tokens": 1938959630336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3099385499954224, "created_at": "2025-06-03T04:30:22.611808+00:00"} {"global_step": 231143, "acc_step": 0, "speed/wps": 5514.98420241723, "speed/FLOPS": 243734073498740.94, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.050314001739025116, "optim/lr": 2.787409479249625e-05, "optim/total_tokens": 1938968018944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.302520990371704, "created_at": "2025-06-03T04:30:25.586885+00:00"} {"global_step": 231144, "acc_step": 0, "speed/wps": 5518.06688544915, "speed/FLOPS": 243870312310149.66, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04498856142163277, "optim/lr": 2.7870547567401705e-05, "optim/total_tokens": 1938976407552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3002177476882935, "created_at": "2025-06-03T04:30:28.560052+00:00"} {"global_step": 231145, "acc_step": 0, "speed/wps": 5504.580924938438, "speed/FLOPS": 243274301882979.6, "speed/curr_iter_time": 2.9756, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9756, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 191.05, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.045386701822280884, "optim/lr": 2.786700034230716e-05, "optim/total_tokens": 1938984796160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2894805669784546, "created_at": "2025-06-03T04:30:31.544744+00:00"} {"global_step": 231146, "acc_step": 0, "speed/wps": 5503.242382474493, "speed/FLOPS": 243215145157354.62, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.49 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.49, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04859783127903938, "optim/lr": 2.7863453117212832e-05, "optim/total_tokens": 1938993184768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2995549440383911, "created_at": "2025-06-03T04:30:34.526437+00:00"} {"global_step": 231147, "acc_step": 0, "speed/wps": 5524.174417407272, "speed/FLOPS": 244140233961516.2, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.47 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.47, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04213744029402733, "optim/lr": 2.7859905892118286e-05, "optim/total_tokens": 1939001573376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.294518232345581, "created_at": "2025-06-03T04:30:37.495952+00:00"} {"global_step": 231148, "acc_step": 0, "speed/wps": 5525.594181392565, "speed/FLOPS": 244202980262655.28, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.47 hours", "speed/est_time_elapsed_hrs": 190.33, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.47, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04384112358093262, "optim/lr": 2.785635866702374e-05, "optim/total_tokens": 1939009961984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2948492765426636, "created_at": "2025-06-03T04:30:40.464628+00:00"} {"global_step": 231149, "acc_step": 0, "speed/wps": 5526.267780855002, "speed/FLOPS": 244232749911100.4, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042218420654535294, "optim/lr": 2.7852811441929193e-05, "optim/total_tokens": 1939018350592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.30195152759552, "created_at": "2025-06-03T04:30:43.434323+00:00"} {"global_step": 231150, "acc_step": 0, "speed/wps": 5512.033411690053, "speed/FLOPS": 243603663652115.8, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043076686561107635, "optim/lr": 2.7849264216834867e-05, "optim/total_tokens": 1939026739200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.302255392074585, "created_at": "2025-06-03T04:30:46.415579+00:00"} {"global_step": 231151, "acc_step": 0, "speed/wps": 5521.736886875126, "speed/FLOPS": 244032507588407.66, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.47 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.47, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04368799552321434, "optim/lr": 2.784571699174032e-05, "optim/total_tokens": 1939035127808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2995730638504028, "created_at": "2025-06-03T04:30:49.386614+00:00"} {"global_step": 231152, "acc_step": 0, "speed/wps": 5509.277363933425, "speed/FLOPS": 243481860448004.06, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05017376318573952, "optim/lr": 2.7842169766645774e-05, "optim/total_tokens": 1939043516416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3045908212661743, "created_at": "2025-06-03T04:30:52.364141+00:00"} {"global_step": 231153, "acc_step": 0, "speed/wps": 5506.854227665221, "speed/FLOPS": 243374770227685.2, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04165153577923775, "optim/lr": 2.7838622541551228e-05, "optim/total_tokens": 1939051905024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3094921112060547, "created_at": "2025-06-03T04:30:55.347449+00:00"} {"global_step": 231154, "acc_step": 0, "speed/wps": 5506.569696975601, "speed/FLOPS": 243362195427564.1, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.48 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.48, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04209339991211891, "optim/lr": 2.7835075316456905e-05, "optim/total_tokens": 1939060293632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2984522581100464, "created_at": "2025-06-03T04:30:58.327181+00:00"} {"global_step": 231155, "acc_step": 0, "speed/wps": 5521.545849492449, "speed/FLOPS": 244024064713911.25, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04195516183972359, "optim/lr": 2.7831528091362355e-05, "optim/total_tokens": 1939068682240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.28952956199646, "created_at": "2025-06-03T04:31:01.299879+00:00"} {"global_step": 231156, "acc_step": 0, "speed/wps": 5523.212115462376, "speed/FLOPS": 244097705141059.66, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04089980944991112, "optim/lr": 2.782798086626781e-05, "optim/total_tokens": 1939077070848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2815240621566772, "created_at": "2025-06-03T04:31:04.270421+00:00"} {"global_step": 231157, "acc_step": 0, "speed/wps": 5529.530367732129, "speed/FLOPS": 244376939551635.97, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.049350202083587646, "optim/lr": 2.7824433641173263e-05, "optim/total_tokens": 1939085459456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.308902621269226, "created_at": "2025-06-03T04:31:07.240690+00:00"} {"global_step": 231158, "acc_step": 0, "speed/wps": 5524.173275566009, "speed/FLOPS": 244140183497976.84, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04505976289510727, "optim/lr": 2.782088641607894e-05, "optim/total_tokens": 1939093848064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2996585369110107, "created_at": "2025-06-03T04:31:10.211091+00:00"} {"global_step": 231159, "acc_step": 0, "speed/wps": 5534.143480288782, "speed/FLOPS": 244580815514589.44, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.04, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04180415719747543, "optim/lr": 2.7817339190984393e-05, "optim/total_tokens": 1939102236672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2899494171142578, "created_at": "2025-06-03T04:31:13.175425+00:00"} {"global_step": 231160, "acc_step": 0, "speed/wps": 5528.731015343285, "speed/FLOPS": 244341612267505.5, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04312875494360924, "optim/lr": 2.7813791965889844e-05, "optim/total_tokens": 1939110625280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.3212401866912842, "created_at": "2025-06-03T04:31:16.146476+00:00"} {"global_step": 231161, "acc_step": 0, "speed/wps": 5516.87345633553, "speed/FLOPS": 243817568851851.62, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041117679327726364, "optim/lr": 2.7810244740795297e-05, "optim/total_tokens": 1939119013888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3037487268447876, "created_at": "2025-06-03T04:31:19.120777+00:00"} {"global_step": 231162, "acc_step": 0, "speed/wps": 5511.894305541399, "speed/FLOPS": 243597515872355.12, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.47 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.47, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0413089245557785, "optim/lr": 2.7806697515700974e-05, "optim/total_tokens": 1939127402496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2972444295883179, "created_at": "2025-06-03T04:31:22.097864+00:00"} {"global_step": 231163, "acc_step": 0, "speed/wps": 5519.235614154525, "speed/FLOPS": 243921964136831.44, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042602624744176865, "optim/lr": 2.7803150290606428e-05, "optim/total_tokens": 1939135791104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3088456392288208, "created_at": "2025-06-03T04:31:25.069782+00:00"} {"global_step": 231164, "acc_step": 0, "speed/wps": 5526.520667465757, "speed/FLOPS": 244243926204904.75, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.25, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044149719178676605, "optim/lr": 2.779960306551188e-05, "optim/total_tokens": 1939144179712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2947591543197632, "created_at": "2025-06-03T04:31:28.038115+00:00"} {"global_step": 231165, "acc_step": 0, "speed/wps": 5535.673090448941, "speed/FLOPS": 244648416454413.97, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05042703449726105, "optim/lr": 2.7796055840417332e-05, "optim/total_tokens": 1939152568320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3039088249206543, "created_at": "2025-06-03T04:31:31.002400+00:00"} {"global_step": 231166, "acc_step": 0, "speed/wps": 5524.890934560366, "speed/FLOPS": 244171900352215.72, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04321703314781189, "optim/lr": 2.779250861532301e-05, "optim/total_tokens": 1939160956928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3036463260650635, "created_at": "2025-06-03T04:31:33.971347+00:00"} {"global_step": 231167, "acc_step": 0, "speed/wps": 5529.327649010045, "speed/FLOPS": 244367980421728.34, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04284733161330223, "optim/lr": 2.7788961390228463e-05, "optim/total_tokens": 1939169345536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3079700469970703, "created_at": "2025-06-03T04:31:36.940850+00:00"} {"global_step": 231168, "acc_step": 0, "speed/wps": 5521.924192789512, "speed/FLOPS": 244040785551104.9, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042275041341781616, "optim/lr": 2.7785414165133916e-05, "optim/total_tokens": 1939177734144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.293927550315857, "created_at": "2025-06-03T04:31:39.914887+00:00"} {"global_step": 231169, "acc_step": 0, "speed/wps": 5522.741519198193, "speed/FLOPS": 244076907194912.78, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.44, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04369381442666054, "optim/lr": 2.778186694003959e-05, "optim/total_tokens": 1939186122752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3061208724975586, "created_at": "2025-06-03T04:31:42.884936+00:00"} {"global_step": 231170, "acc_step": 0, "speed/wps": 5504.917271414943, "speed/FLOPS": 243289166675663.75, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.47 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.47, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04181878641247749, "optim/lr": 2.7778319714945044e-05, "optim/total_tokens": 1939194511360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.290138840675354, "created_at": "2025-06-03T04:31:45.867458+00:00"} {"global_step": 231171, "acc_step": 0, "speed/wps": 5514.77947291938, "speed/FLOPS": 243725025502836.53, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04200715571641922, "optim/lr": 2.7774772489850497e-05, "optim/total_tokens": 1939202899968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2815239429473877, "created_at": "2025-06-03T04:31:48.841983+00:00"} {"global_step": 231172, "acc_step": 0, "speed/wps": 5524.5114082698765, "speed/FLOPS": 244155127232767.72, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04212355241179466, "optim/lr": 2.777122526475595e-05, "optim/total_tokens": 1939211288576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3057602643966675, "created_at": "2025-06-03T04:31:51.811044+00:00"} {"global_step": 231173, "acc_step": 0, "speed/wps": 5531.661661040922, "speed/FLOPS": 244471131806936.53, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.14, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04152775555849075, "optim/lr": 2.7767678039661625e-05, "optim/total_tokens": 1939219677184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3058375120162964, "created_at": "2025-06-03T04:31:54.782570+00:00"} {"global_step": 231174, "acc_step": 0, "speed/wps": 5516.258303658578, "speed/FLOPS": 243790382252167.2, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04227691888809204, "optim/lr": 2.776413081456708e-05, "optim/total_tokens": 1939228065792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2849611043930054, "created_at": "2025-06-03T04:31:57.760366+00:00"} {"global_step": 231175, "acc_step": 0, "speed/wps": 5520.533378677923, "speed/FLOPS": 243979318686204.62, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04297519475221634, "optim/lr": 2.7760583589472532e-05, "optim/total_tokens": 1939236454400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2993032932281494, "created_at": "2025-06-03T04:32:00.731981+00:00"} {"global_step": 231176, "acc_step": 0, "speed/wps": 5535.364441464865, "speed/FLOPS": 244634775749126.53, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042119428515434265, "optim/lr": 2.7757036364377986e-05, "optim/total_tokens": 1939244843008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3071781396865845, "created_at": "2025-06-03T04:32:03.701486+00:00"} {"global_step": 231177, "acc_step": 0, "speed/wps": 5526.5732373012925, "speed/FLOPS": 244246249522558.62, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04324263334274292, "optim/lr": 2.775348913928366e-05, "optim/total_tokens": 1939253231616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.306818962097168, "created_at": "2025-06-03T04:32:06.674675+00:00"} {"global_step": 231178, "acc_step": 0, "speed/wps": 5520.428614334171, "speed/FLOPS": 243974688638443.3, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04209088161587715, "optim/lr": 2.7749941914189113e-05, "optim/total_tokens": 1939261620224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3138729333877563, "created_at": "2025-06-03T04:32:09.647781+00:00"} {"global_step": 231179, "acc_step": 0, "speed/wps": 5522.642071500427, "speed/FLOPS": 244072512115691.0, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.45, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042541224509477615, "optim/lr": 2.7746394689094567e-05, "optim/total_tokens": 1939270008832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3191057443618774, "created_at": "2025-06-03T04:32:12.621780+00:00"} {"global_step": 231180, "acc_step": 0, "speed/wps": 5505.213857006538, "speed/FLOPS": 243302274240749.6, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.46 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.46, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.046909794211387634, "optim/lr": 2.774284746400002e-05, "optim/total_tokens": 1939278397440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3041423559188843, "created_at": "2025-06-03T04:32:15.601752+00:00"} {"global_step": 231181, "acc_step": 0, "speed/wps": 5529.619793308894, "speed/FLOPS": 244380891704407.38, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04477845877408981, "optim/lr": 2.7739300238905698e-05, "optim/total_tokens": 1939286786048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2800476551055908, "created_at": "2025-06-03T04:32:18.569274+00:00"} {"global_step": 231182, "acc_step": 0, "speed/wps": 5522.60763132845, "speed/FLOPS": 244070990036370.4, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.047625232487916946, "optim/lr": 2.7735753013811148e-05, "optim/total_tokens": 1939295174656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3014521598815918, "created_at": "2025-06-03T04:32:21.540571+00:00"} {"global_step": 231183, "acc_step": 0, "speed/wps": 5530.672842469479, "speed/FLOPS": 244427431087311.03, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04275396093726158, "optim/lr": 2.77322057887166e-05, "optim/total_tokens": 1939303563264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2954168319702148, "created_at": "2025-06-03T04:32:24.510786+00:00"} {"global_step": 231184, "acc_step": 0, "speed/wps": 5521.607792800077, "speed/FLOPS": 244026802291053.84, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.42, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.055657438933849335, "optim/lr": 2.7728658563622055e-05, "optim/total_tokens": 1939311951872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3167297840118408, "created_at": "2025-06-03T04:32:27.482149+00:00"} {"global_step": 231185, "acc_step": 0, "speed/wps": 5528.206445012897, "speed/FLOPS": 244318428943896.7, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04205199331045151, "optim/lr": 2.7725111338527732e-05, "optim/total_tokens": 1939320340480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2881439924240112, "created_at": "2025-06-03T04:32:30.455605+00:00"} {"global_step": 231186, "acc_step": 0, "speed/wps": 5520.883182371717, "speed/FLOPS": 243994778219012.72, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.051097627729177475, "optim/lr": 2.7721564113433186e-05, "optim/total_tokens": 1939328729088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3013370037078857, "created_at": "2025-06-03T04:32:33.427123+00:00"} {"global_step": 231187, "acc_step": 0, "speed/wps": 5519.848332630918, "speed/FLOPS": 243949043157310.53, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04414801672101021, "optim/lr": 2.7718016888338636e-05, "optim/total_tokens": 1939337117696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.293432354927063, "created_at": "2025-06-03T04:32:36.400502+00:00"} {"global_step": 231188, "acc_step": 0, "speed/wps": 5514.938467460201, "speed/FLOPS": 243732052247732.97, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.047640610486269, "optim/lr": 2.771446966324409e-05, "optim/total_tokens": 1939345506304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2994775772094727, "created_at": "2025-06-03T04:32:39.380808+00:00"} {"global_step": 231189, "acc_step": 0, "speed/wps": 5521.666462393193, "speed/FLOPS": 244029395186771.34, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.057483822107315063, "optim/lr": 2.7710922438149767e-05, "optim/total_tokens": 1939353894912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3130549192428589, "created_at": "2025-06-03T04:32:42.352358+00:00"} {"global_step": 231190, "acc_step": 0, "speed/wps": 5521.541988777786, "speed/FLOPS": 244023894090084.1, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04650917649269104, "optim/lr": 2.770737521305522e-05, "optim/total_tokens": 1939362283520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2884186506271362, "created_at": "2025-06-03T04:32:45.328221+00:00"} {"global_step": 231191, "acc_step": 0, "speed/wps": 5533.3042900991795, "speed/FLOPS": 244543727603573.8, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.03, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04287547990679741, "optim/lr": 2.7703827987960674e-05, "optim/total_tokens": 1939370672128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.303632378578186, "created_at": "2025-06-03T04:32:48.296467+00:00"} {"global_step": 231192, "acc_step": 0, "speed/wps": 5533.695064236987, "speed/FLOPS": 244560997820301.53, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.08, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0521051324903965, "optim/lr": 2.7700280762866124e-05, "optim/total_tokens": 1939379060736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3100757598876953, "created_at": "2025-06-03T04:32:51.264672+00:00"} {"global_step": 231193, "acc_step": 0, "speed/wps": 5517.802751118407, "speed/FLOPS": 243858638924692.9, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04666749760508537, "optim/lr": 2.76967335377718e-05, "optim/total_tokens": 1939387449344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2977758646011353, "created_at": "2025-06-03T04:32:54.242041+00:00"} {"global_step": 231194, "acc_step": 0, "speed/wps": 5518.071457437196, "speed/FLOPS": 243870514368619.75, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04826502874493599, "optim/lr": 2.7693186312677255e-05, "optim/total_tokens": 1939395837952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2848293781280518, "created_at": "2025-06-03T04:32:57.219012+00:00"} {"global_step": 231195, "acc_step": 0, "speed/wps": 5519.776427910434, "speed/FLOPS": 243945865336706.88, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.045794907957315445, "optim/lr": 2.768963908758271e-05, "optim/total_tokens": 1939404226560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3011163473129272, "created_at": "2025-06-03T04:33:00.191594+00:00"} {"global_step": 231196, "acc_step": 0, "speed/wps": 5504.660372106538, "speed/FLOPS": 243277813041162.1, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05556059628725052, "optim/lr": 2.7686091862488383e-05, "optim/total_tokens": 1939412615168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2997559309005737, "created_at": "2025-06-03T04:33:03.176924+00:00"} {"global_step": 231197, "acc_step": 0, "speed/wps": 5516.7212364017005, "speed/FLOPS": 243810841509908.6, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05401431396603584, "optim/lr": 2.7682544637393836e-05, "optim/total_tokens": 1939421003776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2997785806655884, "created_at": "2025-06-03T04:33:06.156270+00:00"} {"global_step": 231198, "acc_step": 0, "speed/wps": 5524.992948472479, "speed/FLOPS": 244176408844976.56, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04680134356021881, "optim/lr": 2.767899741229929e-05, "optim/total_tokens": 1939429392384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3017505407333374, "created_at": "2025-06-03T04:33:09.130225+00:00"} {"global_step": 231199, "acc_step": 0, "speed/wps": 5520.687592640764, "speed/FLOPS": 243986134154023.6, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04944014549255371, "optim/lr": 2.7675450187204743e-05, "optim/total_tokens": 1939437780992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.297918677330017, "created_at": "2025-06-03T04:33:12.106573+00:00"} {"global_step": 231200, "acc_step": 0, "speed/wps": 5519.398555923686, "speed/FLOPS": 243929165329016.78, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.59, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04985664039850235, "optim/lr": 2.7671902962110417e-05, "optim/total_tokens": 1939446169600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2970927953720093, "created_at": "2025-06-03T04:33:15.084996+00:00"} {"global_step": 231201, "acc_step": 0, "speed/wps": 5503.021600203751, "speed/FLOPS": 243205387711053.94, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.45 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.45, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04802443087100983, "optim/lr": 2.766835573701587e-05, "optim/total_tokens": 1939454558208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.29246187210083, "created_at": "2025-06-03T04:33:18.067206+00:00"} {"global_step": 231202, "acc_step": 0, "speed/wps": 5517.3872251080975, "speed/FLOPS": 243840274801892.12, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05006030946969986, "optim/lr": 2.7664808511921324e-05, "optim/total_tokens": 1939462946816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3080631494522095, "created_at": "2025-06-03T04:33:21.043483+00:00"} {"global_step": 231203, "acc_step": 0, "speed/wps": 5516.3247454801085, "speed/FLOPS": 243793318640598.75, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04540364071726799, "optim/lr": 2.7661261286826778e-05, "optim/total_tokens": 1939471335424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2992242574691772, "created_at": "2025-06-03T04:33:24.017042+00:00"} {"global_step": 231204, "acc_step": 0, "speed/wps": 5517.22825718297, "speed/FLOPS": 243833249233273.1, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04455955699086189, "optim/lr": 2.7657714061732452e-05, "optim/total_tokens": 1939479724032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3085212707519531, "created_at": "2025-06-03T04:33:26.990504+00:00"} {"global_step": 231205, "acc_step": 0, "speed/wps": 5507.143689471021, "speed/FLOPS": 243387562957901.75, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04202793911099434, "optim/lr": 2.7654166836637905e-05, "optim/total_tokens": 1939488112640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2935515642166138, "created_at": "2025-06-03T04:33:29.973743+00:00"} {"global_step": 231206, "acc_step": 0, "speed/wps": 5512.109644981033, "speed/FLOPS": 243607032773379.78, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05236447602510452, "optim/lr": 2.765061961154336e-05, "optim/total_tokens": 1939496501248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2970497608184814, "created_at": "2025-06-03T04:33:32.954582+00:00"} {"global_step": 231207, "acc_step": 0, "speed/wps": 5519.329684164972, "speed/FLOPS": 243926121549799.22, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04208311811089516, "optim/lr": 2.7647072386448813e-05, "optim/total_tokens": 1939504889856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2977006435394287, "created_at": "2025-06-03T04:33:35.927504+00:00"} {"global_step": 231208, "acc_step": 0, "speed/wps": 5520.863877421478, "speed/FLOPS": 243993925039023.84, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05051649361848831, "optim/lr": 2.7643525161354486e-05, "optim/total_tokens": 1939513278464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3059784173965454, "created_at": "2025-06-03T04:33:38.901878+00:00"} {"global_step": 231209, "acc_step": 0, "speed/wps": 5518.472755275658, "speed/FLOPS": 243888249679051.22, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04994343966245651, "optim/lr": 2.763997793625994e-05, "optim/total_tokens": 1939521667072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3046839237213135, "created_at": "2025-06-03T04:33:41.874398+00:00"} {"global_step": 231210, "acc_step": 0, "speed/wps": 5511.4029928898, "speed/FLOPS": 243575802367920.56, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04446369409561157, "optim/lr": 2.7636430711165394e-05, "optim/total_tokens": 1939530055680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3076810836791992, "created_at": "2025-06-03T04:33:44.855064+00:00"} {"global_step": 231211, "acc_step": 0, "speed/wps": 5510.587630582545, "speed/FLOPS": 243539767527342.5, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 190.82, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04234464839100838, "optim/lr": 2.7632883486070847e-05, "optim/total_tokens": 1939538444288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2896136045455933, "created_at": "2025-06-03T04:33:47.835509+00:00"} {"global_step": 231212, "acc_step": 0, "speed/wps": 5521.863308740753, "speed/FLOPS": 244038094787782.6, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04728858917951584, "optim/lr": 2.7629336260976525e-05, "optim/total_tokens": 1939546832896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.300681233406067, "created_at": "2025-06-03T04:33:50.807072+00:00"} {"global_step": 231213, "acc_step": 0, "speed/wps": 5517.051909067232, "speed/FLOPS": 243825455549188.97, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042323049157857895, "optim/lr": 2.7625789035881975e-05, "optim/total_tokens": 1939555221504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2912293672561646, "created_at": "2025-06-03T04:33:53.785980+00:00"} {"global_step": 231214, "acc_step": 0, "speed/wps": 5535.137869008664, "speed/FLOPS": 244624762406265.38, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 189.99, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043370552361011505, "optim/lr": 2.762224181078743e-05, "optim/total_tokens": 1939563610112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.29463529586792, "created_at": "2025-06-03T04:33:56.754078+00:00"} {"global_step": 231215, "acc_step": 0, "speed/wps": 5528.76631426193, "speed/FLOPS": 244343172299033.34, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04365641251206398, "optim/lr": 2.7618694585692882e-05, "optim/total_tokens": 1939571998720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2893561124801636, "created_at": "2025-06-03T04:33:59.727258+00:00"} {"global_step": 231216, "acc_step": 0, "speed/wps": 5507.527053713494, "speed/FLOPS": 243404505695182.97, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.43 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.43, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04286538064479828, "optim/lr": 2.761514736059856e-05, "optim/total_tokens": 1939580387328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3084657192230225, "created_at": "2025-06-03T04:34:02.708950+00:00"} {"global_step": 231217, "acc_step": 0, "speed/wps": 5526.361718787304, "speed/FLOPS": 244236901486890.25, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044299714267253876, "optim/lr": 2.7611600135504013e-05, "optim/total_tokens": 1939588775936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2922981977462769, "created_at": "2025-06-03T04:34:05.680112+00:00"} {"global_step": 231218, "acc_step": 0, "speed/wps": 5528.505649701607, "speed/FLOPS": 244331652259669.22, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04295350983738899, "optim/lr": 2.7608052910409463e-05, "optim/total_tokens": 1939597164544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.31006920337677, "created_at": "2025-06-03T04:34:08.648231+00:00"} {"global_step": 231219, "acc_step": 0, "speed/wps": 5540.171581812522, "speed/FLOPS": 244847226747318.16, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041503578424453735, "optim/lr": 2.7604505685314917e-05, "optim/total_tokens": 1939605553152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2906498908996582, "created_at": "2025-06-03T04:34:11.612058+00:00"} {"global_step": 231220, "acc_step": 0, "speed/wps": 5522.794149363217, "speed/FLOPS": 244079233178821.25, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04202534630894661, "optim/lr": 2.7600958460220594e-05, "optim/total_tokens": 1939613941760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3061858415603638, "created_at": "2025-06-03T04:34:14.586487+00:00"} {"global_step": 231221, "acc_step": 0, "speed/wps": 5495.127054745448, "speed/FLOPS": 242856489209743.66, "speed/curr_iter_time": 2.9798, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9798, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.44 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.44, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04395192489027977, "optim/lr": 2.7597411235126047e-05, "optim/total_tokens": 1939622330368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2776069641113281, "created_at": "2025-06-03T04:34:17.574546+00:00"} {"global_step": 231222, "acc_step": 0, "speed/wps": 5515.194376256524, "speed/FLOPS": 243743362106670.5, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04196504130959511, "optim/lr": 2.75938640100315e-05, "optim/total_tokens": 1939630718976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2891885042190552, "created_at": "2025-06-03T04:34:20.548678+00:00"} {"global_step": 231223, "acc_step": 0, "speed/wps": 5529.55606893573, "speed/FLOPS": 244378075413284.44, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04251372069120407, "optim/lr": 2.7590316784936955e-05, "optim/total_tokens": 1939639107584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.288063883781433, "created_at": "2025-06-03T04:34:23.515442+00:00"} {"global_step": 231224, "acc_step": 0, "speed/wps": 5523.737529542909, "speed/FLOPS": 244120925754106.2, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04166066646575928, "optim/lr": 2.758676955984263e-05, "optim/total_tokens": 1939647496192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3105217218399048, "created_at": "2025-06-03T04:34:26.488317+00:00"} {"global_step": 231225, "acc_step": 0, "speed/wps": 5519.425487331105, "speed/FLOPS": 243930355559377.25, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04369696229696274, "optim/lr": 2.7583222334748082e-05, "optim/total_tokens": 1939655884800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.312993049621582, "created_at": "2025-06-03T04:34:29.463652+00:00"} {"global_step": 231226, "acc_step": 0, "speed/wps": 5517.135497212882, "speed/FLOPS": 243829149717383.78, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041273605078458786, "optim/lr": 2.7579675109653536e-05, "optim/total_tokens": 1939664273408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2911890745162964, "created_at": "2025-06-03T04:34:32.437416+00:00"} {"global_step": 231227, "acc_step": 0, "speed/wps": 5516.159676517656, "speed/FLOPS": 243786023437357.9, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04425928369164467, "optim/lr": 2.757612788455921e-05, "optim/total_tokens": 1939672662016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2963486909866333, "created_at": "2025-06-03T04:34:35.411988+00:00"} {"global_step": 231228, "acc_step": 0, "speed/wps": 5514.378650662982, "speed/FLOPS": 243707311210698.03, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04468801990151405, "optim/lr": 2.7572580659464663e-05, "optim/total_tokens": 1939681050624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2926443815231323, "created_at": "2025-06-03T04:34:38.390995+00:00"} {"global_step": 231229, "acc_step": 0, "speed/wps": 5514.587513843865, "speed/FLOPS": 243716541894234.38, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04188406467437744, "optim/lr": 2.7569033434370117e-05, "optim/total_tokens": 1939689439232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.289510726928711, "created_at": "2025-06-03T04:34:41.366255+00:00"} {"global_step": 231230, "acc_step": 0, "speed/wps": 5520.179581220593, "speed/FLOPS": 243963682649490.2, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043623216450214386, "optim/lr": 2.756548620927557e-05, "optim/total_tokens": 1939697827840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.297088384628296, "created_at": "2025-06-03T04:34:44.342796+00:00"} {"global_step": 231231, "acc_step": 0, "speed/wps": 5529.925497015482, "speed/FLOPS": 244394402243505.12, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04729413986206055, "optim/lr": 2.7561938984181244e-05, "optim/total_tokens": 1939706216448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2930353879928589, "created_at": "2025-06-03T04:34:47.313427+00:00"} {"global_step": 231232, "acc_step": 0, "speed/wps": 5525.140229404549, "speed/FLOPS": 244182917908321.9, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04603038728237152, "optim/lr": 2.7558391759086698e-05, "optim/total_tokens": 1939714605056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3053358793258667, "created_at": "2025-06-03T04:34:50.284119+00:00"} {"global_step": 231233, "acc_step": 0, "speed/wps": 5520.2308530342525, "speed/FLOPS": 243965948601221.0, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04269307106733322, "optim/lr": 2.755484453399215e-05, "optim/total_tokens": 1939722993664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2918508052825928, "created_at": "2025-06-03T04:34:53.256256+00:00"} {"global_step": 231234, "acc_step": 0, "speed/wps": 5522.722714873263, "speed/FLOPS": 244076076140000.16, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.45, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04412953183054924, "optim/lr": 2.7551297308897605e-05, "optim/total_tokens": 1939731382272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3030776977539062, "created_at": "2025-06-03T04:34:56.226418+00:00"} {"global_step": 231235, "acc_step": 0, "speed/wps": 5507.937910697627, "speed/FLOPS": 243422663470924.97, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04296892508864403, "optim/lr": 2.754775008380328e-05, "optim/total_tokens": 1939739770880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2911375761032104, "created_at": "2025-06-03T04:34:59.208573+00:00"} {"global_step": 231236, "acc_step": 0, "speed/wps": 5510.494087896934, "speed/FLOPS": 243535633419433.34, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.045909419655799866, "optim/lr": 2.7544202858708732e-05, "optim/total_tokens": 1939748159488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.298906922340393, "created_at": "2025-06-03T04:35:02.185312+00:00"} {"global_step": 231237, "acc_step": 0, "speed/wps": 5516.864848334931, "speed/FLOPS": 243817188422284.88, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04272529110312462, "optim/lr": 2.7540655633614186e-05, "optim/total_tokens": 1939756548096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2976195812225342, "created_at": "2025-06-03T04:35:05.164769+00:00"} {"global_step": 231238, "acc_step": 0, "speed/wps": 5513.326464486919, "speed/FLOPS": 243660809967293.1, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04376458749175072, "optim/lr": 2.753710840851964e-05, "optim/total_tokens": 1939764936704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.305061936378479, "created_at": "2025-06-03T04:35:08.141278+00:00"} {"global_step": 231239, "acc_step": 0, "speed/wps": 5512.393109303297, "speed/FLOPS": 243619560445521.9, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.41 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.41, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043399080634117126, "optim/lr": 2.7533561183425317e-05, "optim/total_tokens": 1939773325312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3080899715423584, "created_at": "2025-06-03T04:35:11.121338+00:00"} {"global_step": 231240, "acc_step": 0, "speed/wps": 5528.745953756587, "speed/FLOPS": 244342272468911.72, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04187683016061783, "optim/lr": 2.7530013958330767e-05, "optim/total_tokens": 1939781713920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3027245998382568, "created_at": "2025-06-03T04:35:14.089096+00:00"} {"global_step": 231241, "acc_step": 0, "speed/wps": 5525.30332086978, "speed/FLOPS": 244190125716307.3, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04195578768849373, "optim/lr": 2.752646673323622e-05, "optim/total_tokens": 1939790102528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3053829669952393, "created_at": "2025-06-03T04:35:17.060209+00:00"} {"global_step": 231242, "acc_step": 0, "speed/wps": 5511.217829188963, "speed/FLOPS": 243567619080097.3, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044309623539447784, "optim/lr": 2.7522919508141674e-05, "optim/total_tokens": 1939798491136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.316866159439087, "created_at": "2025-06-03T04:35:20.037402+00:00"} {"global_step": 231243, "acc_step": 0, "speed/wps": 5514.138853720253, "speed/FLOPS": 243696713413221.4, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041462939232587814, "optim/lr": 2.751937228304735e-05, "optim/total_tokens": 1939806879744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2916830778121948, "created_at": "2025-06-03T04:35:23.013591+00:00"} {"global_step": 231244, "acc_step": 0, "speed/wps": 5519.205854823782, "speed/FLOPS": 243920648926734.66, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0478346012532711, "optim/lr": 2.7515825057952805e-05, "optim/total_tokens": 1939815268352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3184956312179565, "created_at": "2025-06-03T04:35:25.988506+00:00"} {"global_step": 231245, "acc_step": 0, "speed/wps": 5512.24998657075, "speed/FLOPS": 243613235153311.88, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.4 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.4, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0547955222427845, "optim/lr": 2.7512277832858255e-05, "optim/total_tokens": 1939823656960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2962315082550049, "created_at": "2025-06-03T04:35:28.969222+00:00"} {"global_step": 231246, "acc_step": 0, "speed/wps": 5498.928037847241, "speed/FLOPS": 243024473207647.75, "speed/curr_iter_time": 2.9786, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9786, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.42 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.42, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042095642536878586, "optim/lr": 2.750873060776371e-05, "optim/total_tokens": 1939832045568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2955161333084106, "created_at": "2025-06-03T04:35:31.952517+00:00"} {"global_step": 231247, "acc_step": 0, "speed/wps": 5517.6123133606425, "speed/FLOPS": 243850222550548.5, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.054162606596946716, "optim/lr": 2.7505183382669386e-05, "optim/total_tokens": 1939840434176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3054983615875244, "created_at": "2025-06-03T04:35:34.929764+00:00"} {"global_step": 231248, "acc_step": 0, "speed/wps": 5522.007565513416, "speed/FLOPS": 244044470198761.2, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04170569032430649, "optim/lr": 2.750163615757484e-05, "optim/total_tokens": 1939848822784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.293031096458435, "created_at": "2025-06-03T04:35:37.900592+00:00"} {"global_step": 231249, "acc_step": 0, "speed/wps": 5524.229758895011, "speed/FLOPS": 244142679772010.88, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.38 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.38, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05263384431600571, "optim/lr": 2.7498088932480293e-05, "optim/total_tokens": 1939857211392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.291826844215393, "created_at": "2025-06-03T04:35:40.870178+00:00"} {"global_step": 231250, "acc_step": 0, "speed/wps": 5527.155608514008, "speed/FLOPS": 244271987349314.6, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.38 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.38, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041928429156541824, "optim/lr": 2.7494541707385744e-05, "optim/total_tokens": 1939865600000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3013510704040527, "created_at": "2025-06-03T04:35:43.837967+00:00"} {"global_step": 231251, "acc_step": 0, "speed/wps": 5516.403306021863, "speed/FLOPS": 243796790614434.97, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.05026155337691307, "optim/lr": 2.749099448229142e-05, "optim/total_tokens": 1939873988608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3093833923339844, "created_at": "2025-06-03T04:35:46.811704+00:00"} {"global_step": 231252, "acc_step": 0, "speed/wps": 5521.744671247882, "speed/FLOPS": 244032851617839.4, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.38 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.38, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041311487555503845, "optim/lr": 2.7487447257196874e-05, "optim/total_tokens": 1939882377216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2938193082809448, "created_at": "2025-06-03T04:35:49.786430+00:00"} {"global_step": 231253, "acc_step": 0, "speed/wps": 5523.254742840207, "speed/FLOPS": 244099589052973.1, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.38 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.38, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.045458145439624786, "optim/lr": 2.7483900032102328e-05, "optim/total_tokens": 1939890765824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.311631679534912, "created_at": "2025-06-03T04:35:52.760047+00:00"} {"global_step": 231254, "acc_step": 0, "speed/wps": 5521.410162757328, "speed/FLOPS": 244018068054726.6, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.38 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.38, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04325052723288536, "optim/lr": 2.7480352807008002e-05, "optim/total_tokens": 1939899154432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.279728651046753, "created_at": "2025-06-03T04:35:55.734718+00:00"} {"global_step": 231255, "acc_step": 0, "speed/wps": 5513.556184771939, "speed/FLOPS": 243670962428075.97, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.83, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04871053993701935, "optim/lr": 2.7476805581913455e-05, "optim/total_tokens": 1939907543040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.299292802810669, "created_at": "2025-06-03T04:35:58.713769+00:00"} {"global_step": 231256, "acc_step": 0, "speed/wps": 5515.595023565852, "speed/FLOPS": 243761068667043.97, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04111742600798607, "optim/lr": 2.747325835681891e-05, "optim/total_tokens": 1939915931648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.294423222541809, "created_at": "2025-06-03T04:36:01.692516+00:00"} {"global_step": 231257, "acc_step": 0, "speed/wps": 5529.435589059374, "speed/FLOPS": 244372750819421.44, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043914321810007095, "optim/lr": 2.7469711131724363e-05, "optim/total_tokens": 1939924320256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2811423540115356, "created_at": "2025-06-03T04:36:04.659853+00:00"} {"global_step": 231258, "acc_step": 0, "speed/wps": 5520.8455588728975, "speed/FLOPS": 243993115452939.4, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.38 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.38, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04227125644683838, "optim/lr": 2.7466163906630037e-05, "optim/total_tokens": 1939932708864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.278828740119934, "created_at": "2025-06-03T04:36:07.631541+00:00"} {"global_step": 231259, "acc_step": 0, "speed/wps": 5525.0860210014225, "speed/FLOPS": 244180522174367.47, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.44, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.049258098006248474, "optim/lr": 2.746261668153549e-05, "optim/total_tokens": 1939941097472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2817195653915405, "created_at": "2025-06-03T04:36:10.600122+00:00"} {"global_step": 231260, "acc_step": 0, "speed/wps": 5509.75645039897, "speed/FLOPS": 243503033617594.3, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.39 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.39, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04186325892806053, "optim/lr": 2.7459069456440944e-05, "optim/total_tokens": 1939949486080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2833175659179688, "created_at": "2025-06-03T04:36:13.580486+00:00"} {"global_step": 231261, "acc_step": 0, "speed/wps": 5534.183601590487, "speed/FLOPS": 244582588670765.4, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.06, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04866510629653931, "optim/lr": 2.7455522231346397e-05, "optim/total_tokens": 1939957874688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3059062957763672, "created_at": "2025-06-03T04:36:16.544351+00:00"} {"global_step": 231262, "acc_step": 0, "speed/wps": 5516.8656861237805, "speed/FLOPS": 243817225448263.84, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.38 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.38, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04177917167544365, "optim/lr": 2.745197500625207e-05, "optim/total_tokens": 1939966263296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2906087636947632, "created_at": "2025-06-03T04:36:19.517452+00:00"} {"global_step": 231263, "acc_step": 0, "speed/wps": 5533.516990928295, "speed/FLOPS": 244553127891519.2, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04670112207531929, "optim/lr": 2.7448427781157525e-05, "optim/total_tokens": 1939974651904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.293766736984253, "created_at": "2025-06-03T04:36:22.486139+00:00"} {"global_step": 231264, "acc_step": 0, "speed/wps": 5523.9096252174095, "speed/FLOPS": 244128531502053.56, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043330639600753784, "optim/lr": 2.744488055606298e-05, "optim/total_tokens": 1939983040512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2949094772338867, "created_at": "2025-06-03T04:36:25.457586+00:00"} {"global_step": 231265, "acc_step": 0, "speed/wps": 5518.958736987515, "speed/FLOPS": 243909727583235.4, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.59, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044197678565979004, "optim/lr": 2.7441333330968432e-05, "optim/total_tokens": 1939991429120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.298287272453308, "created_at": "2025-06-03T04:36:28.432880+00:00"} {"global_step": 231266, "acc_step": 0, "speed/wps": 5525.624583261442, "speed/FLOPS": 244204323869648.8, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.042156293988227844, "optim/lr": 2.7437786105874106e-05, "optim/total_tokens": 1939999817728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2904866933822632, "created_at": "2025-06-03T04:36:31.406079+00:00"} {"global_step": 231267, "acc_step": 0, "speed/wps": 5523.924248358858, "speed/FLOPS": 244129177770057.56, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.043047480285167694, "optim/lr": 2.743423888077956e-05, "optim/total_tokens": 1940008206336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3113181591033936, "created_at": "2025-06-03T04:36:34.376117+00:00"} {"global_step": 231268, "acc_step": 0, "speed/wps": 5522.208687411708, "speed/FLOPS": 244053358757230.47, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04153444990515709, "optim/lr": 2.7430691655685013e-05, "optim/total_tokens": 1940016594944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2959904670715332, "created_at": "2025-06-03T04:36:37.351195+00:00"} {"global_step": 231269, "acc_step": 0, "speed/wps": 5520.007051908892, "speed/FLOPS": 243956057736998.1, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04380765184760094, "optim/lr": 2.7427144430590467e-05, "optim/total_tokens": 1940024983552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.3017131090164185, "created_at": "2025-06-03T04:36:40.324946+00:00"} {"global_step": 231270, "acc_step": 0, "speed/wps": 5517.607318150953, "speed/FLOPS": 243850001787848.03, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041475363075733185, "optim/lr": 2.7423597205496144e-05, "optim/total_tokens": 1940033372160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2972482442855835, "created_at": "2025-06-03T04:36:43.301962+00:00"} {"global_step": 231271, "acc_step": 0, "speed/wps": 5526.654090582135, "speed/FLOPS": 244249822823727.25, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04920046776533127, "optim/lr": 2.7420049980401594e-05, "optim/total_tokens": 1940041760768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2971848249435425, "created_at": "2025-06-03T04:36:46.272668+00:00"} {"global_step": 231272, "acc_step": 0, "speed/wps": 5520.66254119144, "speed/FLOPS": 243985027008188.4, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.046049654483795166, "optim/lr": 2.7416502755307048e-05, "optim/total_tokens": 1940050149376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3043172359466553, "created_at": "2025-06-03T04:36:49.245020+00:00"} {"global_step": 231273, "acc_step": 0, "speed/wps": 5527.476088590993, "speed/FLOPS": 244286150928351.56, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044441331177949905, "optim/lr": 2.74129555302125e-05, "optim/total_tokens": 1940058537984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2968287467956543, "created_at": "2025-06-03T04:36:52.214195+00:00"} {"global_step": 231274, "acc_step": 0, "speed/wps": 5529.187839774784, "speed/FLOPS": 244361801569138.34, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.045527536422014236, "optim/lr": 2.740940830511818e-05, "optim/total_tokens": 1940066926592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2904436588287354, "created_at": "2025-06-03T04:36:55.182320+00:00"} {"global_step": 231275, "acc_step": 0, "speed/wps": 5522.934852630096, "speed/FLOPS": 244085451543032.72, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.45, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.044806551188230515, "optim/lr": 2.7405861080023632e-05, "optim/total_tokens": 1940075315200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.3084501028060913, "created_at": "2025-06-03T04:36:58.153479+00:00"} {"global_step": 231276, "acc_step": 0, "speed/wps": 5530.530415459509, "speed/FLOPS": 244421136542477.84, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05148104950785637, "optim/lr": 2.7402313854929082e-05, "optim/total_tokens": 1940083703808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2924320697784424, "created_at": "2025-06-03T04:37:01.124650+00:00"} {"global_step": 231277, "acc_step": 0, "speed/wps": 5522.071135088356, "speed/FLOPS": 244047279648594.94, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.04456440731883049, "optim/lr": 2.7398766629834536e-05, "optim/total_tokens": 1940092092416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3122073411941528, "created_at": "2025-06-03T04:37:04.095798+00:00"} {"global_step": 231278, "acc_step": 0, "speed/wps": 5516.029283034627, "speed/FLOPS": 243780260712822.34, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.7, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.0565871000289917, "optim/lr": 2.7395219404740213e-05, "optim/total_tokens": 1940100481024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2998287677764893, "created_at": "2025-06-03T04:37:07.074221+00:00"} {"global_step": 231279, "acc_step": 0, "speed/wps": 5511.923429126888, "speed/FLOPS": 243598802985765.7, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.37 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.37, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.041660573333501816, "optim/lr": 2.7391672179645667e-05, "optim/total_tokens": 1940108869632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.298543930053711, "created_at": "2025-06-03T04:37:10.054377+00:00"} {"global_step": 231280, "acc_step": 0, "speed/wps": 5522.723210292591, "speed/FLOPS": 244076098034998.66, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.06034010276198387, "optim/lr": 2.738812495455112e-05, "optim/total_tokens": 1940117258240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2999870777130127, "created_at": "2025-06-03T04:37:13.027592+00:00"} {"global_step": 231281, "acc_step": 0, "speed/wps": 5524.473953027719, "speed/FLOPS": 244153471902777.7, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04222649708390236, "optim/lr": 2.7384577729456794e-05, "optim/total_tokens": 1940125646848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.299302577972412, "created_at": "2025-06-03T04:37:15.999857+00:00"} {"global_step": 231282, "acc_step": 0, "speed/wps": 5531.516618968945, "speed/FLOPS": 244464721689747.78, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04447772726416588, "optim/lr": 2.7381030504362248e-05, "optim/total_tokens": 1940134035456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2891861200332642, "created_at": "2025-06-03T04:37:18.965683+00:00"} {"global_step": 231283, "acc_step": 0, "speed/wps": 5534.9372143703795, "speed/FLOPS": 244615894498296.75, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.34 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.34, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04482812061905861, "optim/lr": 2.73774832792677e-05, "optim/total_tokens": 1940142424064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2871253490447998, "created_at": "2025-06-03T04:37:21.933586+00:00"} {"global_step": 231284, "acc_step": 0, "speed/wps": 5526.424951595546, "speed/FLOPS": 244239696053359.7, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04457987844944, "optim/lr": 2.7373936054173155e-05, "optim/total_tokens": 1940150812672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2961442470550537, "created_at": "2025-06-03T04:37:24.905461+00:00"} {"global_step": 231285, "acc_step": 0, "speed/wps": 5517.603953116994, "speed/FLOPS": 243849853070570.84, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04376216232776642, "optim/lr": 2.737038882907883e-05, "optim/total_tokens": 1940159201280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2837556600570679, "created_at": "2025-06-03T04:37:27.880372+00:00"} {"global_step": 231286, "acc_step": 0, "speed/wps": 5518.736097221931, "speed/FLOPS": 243899888045170.22, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04238971322774887, "optim/lr": 2.7366841603984282e-05, "optim/total_tokens": 1940167589888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3043028116226196, "created_at": "2025-06-03T04:37:30.852910+00:00"} {"global_step": 231287, "acc_step": 0, "speed/wps": 5513.769253275806, "speed/FLOPS": 243680378965363.4, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.046342141926288605, "optim/lr": 2.7363294378889736e-05, "optim/total_tokens": 1940175978496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2912734746932983, "created_at": "2025-06-03T04:37:33.827960+00:00"} {"global_step": 231288, "acc_step": 0, "speed/wps": 5511.71290270283, "speed/FLOPS": 243589498795394.28, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0025, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04214545339345932, "optim/lr": 2.735974715379519e-05, "optim/total_tokens": 1940184367104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2938846349716187, "created_at": "2025-06-03T04:37:36.804138+00:00"} {"global_step": 231289, "acc_step": 0, "speed/wps": 5520.998203153224, "speed/FLOPS": 243999861548825.56, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04590115696191788, "optim/lr": 2.7356199928700864e-05, "optim/total_tokens": 1940192755712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3044755458831787, "created_at": "2025-06-03T04:37:39.776972+00:00"} {"global_step": 231290, "acc_step": 0, "speed/wps": 5527.72082166625, "speed/FLOPS": 244296966877620.5, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04193134233355522, "optim/lr": 2.7352652703606317e-05, "optim/total_tokens": 1940201144320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3146557807922363, "created_at": "2025-06-03T04:37:42.748185+00:00"} {"global_step": 231291, "acc_step": 0, "speed/wps": 5532.282426679752, "speed/FLOPS": 244498566470806.22, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.34 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.34, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04723885655403137, "optim/lr": 2.734910547851177e-05, "optim/total_tokens": 1940209532928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.287872314453125, "created_at": "2025-06-03T04:37:45.713927+00:00"} {"global_step": 231292, "acc_step": 0, "speed/wps": 5531.558098850877, "speed/FLOPS": 244466554888215.9, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.34 hours", "speed/est_time_elapsed_hrs": 190.18, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.34, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04100773110985756, "optim/lr": 2.7345558253417224e-05, "optim/total_tokens": 1940217921536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2997368574142456, "created_at": "2025-06-03T04:37:48.678986+00:00"} {"global_step": 231293, "acc_step": 0, "speed/wps": 5509.902597407164, "speed/FLOPS": 243509492567308.3, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.27, "optim/grad_norm": 0.046914272010326385, "optim/lr": 2.7342011028322898e-05, "optim/total_tokens": 1940226310144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2881345748901367, "created_at": "2025-06-03T04:37:51.657075+00:00"} {"global_step": 231294, "acc_step": 0, "speed/wps": 5521.405581769206, "speed/FLOPS": 244017865598499.22, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04316949471831322, "optim/lr": 2.7338463803228352e-05, "optim/total_tokens": 1940234698752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2913436889648438, "created_at": "2025-06-03T04:37:54.628290+00:00"} {"global_step": 231295, "acc_step": 0, "speed/wps": 5520.9080292095805, "speed/FLOPS": 243995876322068.62, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.051896966993808746, "optim/lr": 2.7334916578133805e-05, "optim/total_tokens": 1940243087360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2798242568969727, "created_at": "2025-06-03T04:37:57.599474+00:00"} {"global_step": 231296, "acc_step": 0, "speed/wps": 5526.140055805482, "speed/FLOPS": 244227105117667.72, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.34 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.34, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041588615626096725, "optim/lr": 2.733136935303926e-05, "optim/total_tokens": 1940251475968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2983402013778687, "created_at": "2025-06-03T04:38:00.568084+00:00"} {"global_step": 231297, "acc_step": 0, "speed/wps": 5523.002041884801, "speed/FLOPS": 244088420964184.88, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.050592951476573944, "optim/lr": 2.7327822127944936e-05, "optim/total_tokens": 1940259864576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3085582256317139, "created_at": "2025-06-03T04:38:03.543842+00:00"} {"global_step": 231298, "acc_step": 0, "speed/wps": 5523.769010165236, "speed/FLOPS": 244122317036480.6, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.34 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.34, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04217088595032692, "optim/lr": 2.7324274902850386e-05, "optim/total_tokens": 1940268253184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.301080584526062, "created_at": "2025-06-03T04:38:06.516887+00:00"} {"global_step": 231299, "acc_step": 0, "speed/wps": 5531.311785871117, "speed/FLOPS": 244455669115254.6, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.33 hours", "speed/est_time_elapsed_hrs": 190.26, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.33, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04390145093202591, "optim/lr": 2.732072767775584e-05, "optim/total_tokens": 1940276641792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2925888299942017, "created_at": "2025-06-03T04:38:09.483553+00:00"} {"global_step": 231300, "acc_step": 0, "speed/wps": 5532.7475244396455, "speed/FLOPS": 244519121411207.4, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.33 hours", "speed/est_time_elapsed_hrs": 190.21, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.33, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042143434286117554, "optim/lr": 2.7317180452661294e-05, "optim/total_tokens": 1940285030400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2972755432128906, "created_at": "2025-06-03T04:38:12.450537+00:00"} {"global_step": 231301, "acc_step": 0, "speed/wps": 243.67122026744804, "speed/FLOPS": 10769020713452.428, "speed/curr_iter_time": 2.8935, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.8935, "speed/est_time_elapsed": "7.75 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 185.91, "speed/est_time_elapsed_days": 7.75, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.050830673426389694, "optim/lr": 2.731363322756697e-05, "optim/total_tokens": 1940293419008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2953808307647705, "created_at": "2025-06-03T04:39:19.695033+00:00"} {"global_step": 231302, "acc_step": 0, "speed/wps": 5631.4916369866, "speed/FLOPS": 248883105767597.5, "speed/curr_iter_time": 2.9078, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9078, "speed/est_time_elapsed": "7.78 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 186.83, "speed/est_time_elapsed_days": 7.78, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04101080074906349, "optim/lr": 2.7310086002472424e-05, "optim/total_tokens": 1940301807616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3030519485473633, "created_at": "2025-06-03T04:39:22.611796+00:00"} {"global_step": 231303, "acc_step": 0, "speed/wps": 5609.146468040171, "speed/FLOPS": 247895563673108.2, "speed/curr_iter_time": 2.9199, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9199, "speed/est_time_elapsed": "7.82 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 187.61, "speed/est_time_elapsed_days": 7.82, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04734283313155174, "optim/lr": 2.7306538777377875e-05, "optim/total_tokens": 1940310196224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.294633388519287, "created_at": "2025-06-03T04:39:25.536473+00:00"} {"global_step": 231304, "acc_step": 0, "speed/wps": 5556.705807508029, "speed/FLOPS": 245577954893220.53, "speed/curr_iter_time": 2.9464, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9464, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 189.31, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04201563447713852, "optim/lr": 2.7302991552283328e-05, "optim/total_tokens": 1940318584832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3071140050888062, "created_at": "2025-06-03T04:39:28.493282+00:00"} {"global_step": 231305, "acc_step": 0, "speed/wps": 5548.506091869378, "speed/FLOPS": 245215569431941.5, "speed/curr_iter_time": 2.9519, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9519, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04923541098833084, "optim/lr": 2.7299444327189006e-05, "optim/total_tokens": 1940326973440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3059145212173462, "created_at": "2025-06-03T04:39:31.454899+00:00"} {"global_step": 231306, "acc_step": 0, "speed/wps": 5539.995878894121, "speed/FLOPS": 244839461577653.88, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 189.96, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04219769313931465, "optim/lr": 2.729589710209446e-05, "optim/total_tokens": 1940335362048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3009028434753418, "created_at": "2025-06-03T04:39:34.420316+00:00"} {"global_step": 231307, "acc_step": 0, "speed/wps": 5539.669420001645, "speed/FLOPS": 244825033765574.56, "speed/curr_iter_time": 2.9557, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9557, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.045675717294216156, "optim/lr": 2.7292349876999913e-05, "optim/total_tokens": 1940343750656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.3122602701187134, "created_at": "2025-06-03T04:39:37.384840+00:00"} {"global_step": 231308, "acc_step": 0, "speed/wps": 5505.441043992967, "speed/FLOPS": 243312314742701.34, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.36 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.36, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04330584779381752, "optim/lr": 2.7288802651905587e-05, "optim/total_tokens": 1940352139264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3054229021072388, "created_at": "2025-06-03T04:39:40.367946+00:00"} {"global_step": 231309, "acc_step": 0, "speed/wps": 5522.162943924404, "speed/FLOPS": 244051337129228.06, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.34 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.34, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04970458894968033, "optim/lr": 2.728525542681104e-05, "optim/total_tokens": 1940360527872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2873239517211914, "created_at": "2025-06-03T04:39:43.344104+00:00"} {"global_step": 231310, "acc_step": 0, "speed/wps": 5508.3002353601705, "speed/FLOPS": 243438676366463.66, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.35 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.35, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0412113182246685, "optim/lr": 2.7281708201716494e-05, "optim/total_tokens": 1940368916480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 359, "loss/out": 1.2882499694824219, "created_at": "2025-06-03T04:39:46.326238+00:00"} {"global_step": 231311, "acc_step": 0, "speed/wps": 5541.831413975942, "speed/FLOPS": 244920582833150.16, "speed/curr_iter_time": 2.9556, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9556, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 189.91, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0482664592564106, "optim/lr": 2.7278160976621947e-05, "optim/total_tokens": 1940377305088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2817007303237915, "created_at": "2025-06-03T04:39:49.289863+00:00"} {"global_step": 231312, "acc_step": 0, "speed/wps": 5538.81247252432, "speed/FLOPS": 244787161073331.56, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 190.01, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041103068739175797, "optim/lr": 2.727461375152762e-05, "optim/total_tokens": 1940385693696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2875419855117798, "created_at": "2025-06-03T04:39:52.252145+00:00"} {"global_step": 231313, "acc_step": 0, "speed/wps": 5544.699734390378, "speed/FLOPS": 245047347914073.4, "speed/curr_iter_time": 2.9541, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9541, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 189.81, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.050607725977897644, "optim/lr": 2.7271066526433075e-05, "optim/total_tokens": 1940394082304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2910317182540894, "created_at": "2025-06-03T04:39:55.215387+00:00"} {"global_step": 231314, "acc_step": 0, "speed/wps": 5531.787415403428, "speed/FLOPS": 244476689506090.12, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 190.2, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04642488434910774, "optim/lr": 2.726751930133853e-05, "optim/total_tokens": 1940402470912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2964664697647095, "created_at": "2025-06-03T04:39:58.181427+00:00"} {"global_step": 231315, "acc_step": 0, "speed/wps": 5517.499367415798, "speed/FLOPS": 243845230917896.12, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.34 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.34, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04671676456928253, "optim/lr": 2.7263972076243982e-05, "optim/total_tokens": 1940410859520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2979471683502197, "created_at": "2025-06-03T04:40:01.158653+00:00"} {"global_step": 231316, "acc_step": 0, "speed/wps": 5523.468493107674, "speed/FLOPS": 244109035720722.06, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.33 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.33, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041238319128751755, "optim/lr": 2.7260424851149656e-05, "optim/total_tokens": 1940419248128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.299955129623413, "created_at": "2025-06-03T04:40:04.131909+00:00"} {"global_step": 231317, "acc_step": 0, "speed/wps": 5545.0653900034185, "speed/FLOPS": 245063508020574.72, "speed/curr_iter_time": 2.9529, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9529, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 189.74, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04475264251232147, "optim/lr": 2.725687762605511e-05, "optim/total_tokens": 1940427636736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3009159564971924, "created_at": "2025-06-03T04:40:07.095959+00:00"} {"global_step": 231318, "acc_step": 0, "speed/wps": 5522.9025739678145, "speed/FLOPS": 244084024991377.03, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.33 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.33, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04162546619772911, "optim/lr": 2.7253330400960563e-05, "optim/total_tokens": 1940436025344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2998065948486328, "created_at": "2025-06-03T04:40:10.070866+00:00"} {"global_step": 231319, "acc_step": 0, "speed/wps": 5550.6812131325805, "speed/FLOPS": 245311698658495.16, "speed/curr_iter_time": 2.951, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.951, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 189.62, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0466301292181015, "optim/lr": 2.7249783175866017e-05, "optim/total_tokens": 1940444413952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2940497398376465, "created_at": "2025-06-03T04:40:13.031079+00:00"} {"global_step": 231320, "acc_step": 0, "speed/wps": 5539.932898649031, "speed/FLOPS": 244836678173183.0, "speed/curr_iter_time": 2.9558, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9558, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 189.93, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.045663099735975266, "optim/lr": 2.724623595077169e-05, "optim/total_tokens": 1940452802560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3031014204025269, "created_at": "2025-06-03T04:40:15.992631+00:00"} {"global_step": 231321, "acc_step": 0, "speed/wps": 5545.627394514453, "speed/FLOPS": 245088345743362.6, "speed/curr_iter_time": 2.9536, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9536, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 189.79, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043871279805898666, "optim/lr": 2.7242688725677144e-05, "optim/total_tokens": 1940461191168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2927967309951782, "created_at": "2025-06-03T04:40:18.952081+00:00"} {"global_step": 231322, "acc_step": 0, "speed/wps": 5542.738555410102, "speed/FLOPS": 244960673841369.22, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 189.89, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04649018123745918, "optim/lr": 2.7239141500582598e-05, "optim/total_tokens": 1940469579776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2952855825424194, "created_at": "2025-06-03T04:40:21.915017+00:00"} {"global_step": 231323, "acc_step": 0, "speed/wps": 5529.111112514205, "speed/FLOPS": 244358410616946.47, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041266173124313354, "optim/lr": 2.723559427548805e-05, "optim/total_tokens": 1940477968384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.301818609237671, "created_at": "2025-06-03T04:40:24.885359+00:00"} {"global_step": 231324, "acc_step": 0, "speed/wps": 5529.280397209899, "speed/FLOPS": 244365892134018.5, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042466215789318085, "optim/lr": 2.7232047050393725e-05, "optim/total_tokens": 1940486356992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.308201551437378, "created_at": "2025-06-03T04:40:27.855971+00:00"} {"global_step": 231325, "acc_step": 0, "speed/wps": 5528.955703423963, "speed/FLOPS": 244351542330613.6, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041003189980983734, "optim/lr": 2.722849982529918e-05, "optim/total_tokens": 1940494745600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.29249107837677, "created_at": "2025-06-03T04:40:30.829122+00:00"} {"global_step": 231326, "acc_step": 0, "speed/wps": 5512.330617768477, "speed/FLOPS": 243616798639543.53, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.33 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.33, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043812476098537445, "optim/lr": 2.7224952600204632e-05, "optim/total_tokens": 1940503134208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2925411462783813, "created_at": "2025-06-03T04:40:33.808836+00:00"} {"global_step": 231327, "acc_step": 0, "speed/wps": 5531.644654425213, "speed/FLOPS": 244470380201569.94, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.22, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04184747487306595, "optim/lr": 2.7221405375110086e-05, "optim/total_tokens": 1940511522816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2982654571533203, "created_at": "2025-06-03T04:40:36.774774+00:00"} {"global_step": 231328, "acc_step": 0, "speed/wps": 5535.772367842638, "speed/FLOPS": 244652804007067.62, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041833098977804184, "optim/lr": 2.7217858150015763e-05, "optim/total_tokens": 1940519911424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2784184217453003, "created_at": "2025-06-03T04:40:39.740483+00:00"} {"global_step": 231329, "acc_step": 0, "speed/wps": 5528.266312458376, "speed/FLOPS": 244321074778557.5, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041593555361032486, "optim/lr": 2.7214310924921213e-05, "optim/total_tokens": 1940528300032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.298759937286377, "created_at": "2025-06-03T04:40:42.708965+00:00"} {"global_step": 231330, "acc_step": 0, "speed/wps": 5536.153102824788, "speed/FLOPS": 244669630544500.34, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0411938838660717, "optim/lr": 2.7210763699826667e-05, "optim/total_tokens": 1940536688640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3017632961273193, "created_at": "2025-06-03T04:40:45.676017+00:00"} {"global_step": 231331, "acc_step": 0, "speed/wps": 5528.684613384646, "speed/FLOPS": 244339561538440.38, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04341048374772072, "optim/lr": 2.720721647473212e-05, "optim/total_tokens": 1940545077248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.302725911140442, "created_at": "2025-06-03T04:40:48.647120+00:00"} {"global_step": 231332, "acc_step": 0, "speed/wps": 5529.097864701181, "speed/FLOPS": 244357825131419.25, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041200097650289536, "optim/lr": 2.7203669249637798e-05, "optim/total_tokens": 1940553465856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3081036806106567, "created_at": "2025-06-03T04:40:51.619446+00:00"} {"global_step": 231333, "acc_step": 0, "speed/wps": 5514.4933318622, "speed/FLOPS": 243712379532711.84, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.33 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.33, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04138088971376419, "optim/lr": 2.720012202454325e-05, "optim/total_tokens": 1940561854464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2981548309326172, "created_at": "2025-06-03T04:40:54.596442+00:00"} {"global_step": 231334, "acc_step": 0, "speed/wps": 5522.58000096529, "speed/FLOPS": 244069768915743.78, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04304266348481178, "optim/lr": 2.7196574799448705e-05, "optim/total_tokens": 1940570243072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3099254369735718, "created_at": "2025-06-03T04:40:57.567969+00:00"} {"global_step": 231335, "acc_step": 0, "speed/wps": 5506.264906497738, "speed/FLOPS": 243348725248501.62, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.33 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.33, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041807450354099274, "optim/lr": 2.719302757435438e-05, "optim/total_tokens": 1940578631680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.285498857498169, "created_at": "2025-06-03T04:41:00.551085+00:00"} {"global_step": 231336, "acc_step": 0, "speed/wps": 5513.664864737569, "speed/FLOPS": 243675765526282.3, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04390599951148033, "optim/lr": 2.7189480349259833e-05, "optim/total_tokens": 1940587020288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.309267282485962, "created_at": "2025-06-03T04:41:03.528008+00:00"} {"global_step": 231337, "acc_step": 0, "speed/wps": 5522.464755643416, "speed/FLOPS": 244064675662395.94, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04421006143093109, "optim/lr": 2.7185933124165286e-05, "optim/total_tokens": 1940595408896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2988786697387695, "created_at": "2025-06-03T04:41:06.498291+00:00"} {"global_step": 231338, "acc_step": 0, "speed/wps": 5519.789577403214, "speed/FLOPS": 243946446476982.53, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04501907154917717, "optim/lr": 2.718238589907074e-05, "optim/total_tokens": 1940603797504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2945556640625, "created_at": "2025-06-03T04:41:09.470194+00:00"} {"global_step": 231339, "acc_step": 0, "speed/wps": 5529.512013786369, "speed/FLOPS": 244376128401177.38, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.048383280634880066, "optim/lr": 2.7178838673976414e-05, "optim/total_tokens": 1940612186112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2934566736221313, "created_at": "2025-06-03T04:41:12.437239+00:00"} {"global_step": 231340, "acc_step": 0, "speed/wps": 5527.96386629453, "speed/FLOPS": 244307708206175.28, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04192035645246506, "optim/lr": 2.7175291448881867e-05, "optim/total_tokens": 1940620574720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3016175031661987, "created_at": "2025-06-03T04:41:15.410346+00:00"} {"global_step": 231341, "acc_step": 0, "speed/wps": 5524.15843644283, "speed/FLOPS": 244139527684685.84, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05129735916852951, "optim/lr": 2.717174422378732e-05, "optim/total_tokens": 1940628963328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2963312864303589, "created_at": "2025-06-03T04:41:18.379829+00:00"} {"global_step": 231342, "acc_step": 0, "speed/wps": 5531.42996478726, "speed/FLOPS": 244460892018453.62, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04161583259701729, "optim/lr": 2.7168196998692774e-05, "optim/total_tokens": 1940637351936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2912616729736328, "created_at": "2025-06-03T04:41:21.348304+00:00"} {"global_step": 231343, "acc_step": 0, "speed/wps": 5523.729233543988, "speed/FLOPS": 244120559113416.62, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05289817601442337, "optim/lr": 2.7164649773598448e-05, "optim/total_tokens": 1940645740544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3019070625305176, "created_at": "2025-06-03T04:41:24.321300+00:00"} {"global_step": 231344, "acc_step": 0, "speed/wps": 5524.899310828092, "speed/FLOPS": 244172270540375.56, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04752972349524498, "optim/lr": 2.7161102548503902e-05, "optim/total_tokens": 1940654129152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.302446722984314, "created_at": "2025-06-03T04:41:27.295080+00:00"} {"global_step": 231345, "acc_step": 0, "speed/wps": 5523.053593291089, "speed/FLOPS": 244090699272478.8, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04673832282423973, "optim/lr": 2.7157555323409355e-05, "optim/total_tokens": 1940662517760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.298056960105896, "created_at": "2025-06-03T04:41:30.268193+00:00"} {"global_step": 231346, "acc_step": 0, "speed/wps": 5537.59468977759, "speed/FLOPS": 244733341309103.28, "speed/curr_iter_time": 2.958, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.958, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.09, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.051933903247117996, "optim/lr": 2.715400809831481e-05, "optim/total_tokens": 1940670906368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2923473119735718, "created_at": "2025-06-03T04:41:33.230717+00:00"} {"global_step": 231347, "acc_step": 0, "speed/wps": 5530.1922231377075, "speed/FLOPS": 244406190172879.47, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041877955198287964, "optim/lr": 2.7150460873220483e-05, "optim/total_tokens": 1940679294976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.294945240020752, "created_at": "2025-06-03T04:41:36.200190+00:00"} {"global_step": 231348, "acc_step": 0, "speed/wps": 5527.646330050028, "speed/FLOPS": 244293674729466.16, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04741867259144783, "optim/lr": 2.7146913648125936e-05, "optim/total_tokens": 1940687683584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2781777381896973, "created_at": "2025-06-03T04:41:39.172676+00:00"} {"global_step": 231349, "acc_step": 0, "speed/wps": 5504.140717929101, "speed/FLOPS": 243254846986350.6, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.32 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.32, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04218349605798721, "optim/lr": 2.714336642303139e-05, "optim/total_tokens": 1940696072192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.309137225151062, "created_at": "2025-06-03T04:41:42.153156+00:00"} {"global_step": 231350, "acc_step": 0, "speed/wps": 5523.973092892299, "speed/FLOPS": 244131336448426.7, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.052711255848407745, "optim/lr": 2.7139819197936844e-05, "optim/total_tokens": 1940704460800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.308255672454834, "created_at": "2025-06-03T04:41:45.124819+00:00"} {"global_step": 231351, "acc_step": 0, "speed/wps": 5512.828480390996, "speed/FLOPS": 243638801619167.0, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04315188154578209, "optim/lr": 2.7136271972842518e-05, "optim/total_tokens": 1940712849408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2879101037979126, "created_at": "2025-06-03T04:41:48.101355+00:00"} {"global_step": 231352, "acc_step": 0, "speed/wps": 5528.73196142592, "speed/FLOPS": 244341654079515.47, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.4, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04968077689409256, "optim/lr": 2.713272474774797e-05, "optim/total_tokens": 1940721238016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2961556911468506, "created_at": "2025-06-03T04:41:51.068269+00:00"} {"global_step": 231353, "acc_step": 0, "speed/wps": 5532.0603933045595, "speed/FLOPS": 244488753732092.56, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04197625443339348, "optim/lr": 2.7129177522653425e-05, "optim/total_tokens": 1940729626624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2972220182418823, "created_at": "2025-06-03T04:41:54.033317+00:00"} {"global_step": 231354, "acc_step": 0, "speed/wps": 5534.214075418571, "speed/FLOPS": 244583935457987.53, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.16, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04532656818628311, "optim/lr": 2.712563029755888e-05, "optim/total_tokens": 1940738015232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2983287572860718, "created_at": "2025-06-03T04:41:56.997709+00:00"} {"global_step": 231355, "acc_step": 0, "speed/wps": 5518.3842515931565, "speed/FLOPS": 243884338269287.56, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04330778121948242, "optim/lr": 2.7122083072464556e-05, "optim/total_tokens": 1940746403840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.285603642463684, "created_at": "2025-06-03T04:41:59.973499+00:00"} {"global_step": 231356, "acc_step": 0, "speed/wps": 5525.847054088829, "speed/FLOPS": 244214155941510.4, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05015755817294121, "optim/lr": 2.7118535847370006e-05, "optim/total_tokens": 1940754792448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2831158638000488, "created_at": "2025-06-03T04:42:02.943098+00:00"} {"global_step": 231357, "acc_step": 0, "speed/wps": 5520.128784527849, "speed/FLOPS": 243961437695671.97, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.7, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04641421511769295, "optim/lr": 2.711498862227546e-05, "optim/total_tokens": 1940763181056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3023111820220947, "created_at": "2025-06-03T04:42:05.914778+00:00"} {"global_step": 231358, "acc_step": 0, "speed/wps": 5518.692543245265, "speed/FLOPS": 243897963182331.06, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04802219942212105, "optim/lr": 2.7111441397180913e-05, "optim/total_tokens": 1940771569664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2982593774795532, "created_at": "2025-06-03T04:42:08.887084+00:00"} {"global_step": 231359, "acc_step": 0, "speed/wps": 5514.429129836846, "speed/FLOPS": 243709542131806.97, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04562363401055336, "optim/lr": 2.710789417208659e-05, "optim/total_tokens": 1940779958272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3098307847976685, "created_at": "2025-06-03T04:42:11.861870+00:00"} {"global_step": 231360, "acc_step": 0, "speed/wps": 5515.815070491659, "speed/FLOPS": 243770793614862.34, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04378876835107803, "optim/lr": 2.7104346946992044e-05, "optim/total_tokens": 1940788346880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2976611852645874, "created_at": "2025-06-03T04:42:14.837664+00:00"} {"global_step": 231361, "acc_step": 0, "speed/wps": 5522.224796638946, "speed/FLOPS": 244054070702619.9, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04867689311504364, "optim/lr": 2.7100799721897494e-05, "optim/total_tokens": 1940796735488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2956918478012085, "created_at": "2025-06-03T04:42:17.808077+00:00"} {"global_step": 231362, "acc_step": 0, "speed/wps": 5521.329829773277, "speed/FLOPS": 244014517748013.03, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05039254203438759, "optim/lr": 2.709725249680317e-05, "optim/total_tokens": 1940805124096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2980329990386963, "created_at": "2025-06-03T04:42:20.778896+00:00"} {"global_step": 231363, "acc_step": 0, "speed/wps": 5520.984785836531, "speed/FLOPS": 243999268572103.8, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04278391972184181, "optim/lr": 2.7093705271708625e-05, "optim/total_tokens": 1940813512704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2882370948791504, "created_at": "2025-06-03T04:42:23.751462+00:00"} {"global_step": 231364, "acc_step": 0, "speed/wps": 5514.740609212044, "speed/FLOPS": 243723307925894.75, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 190.83, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05090084299445152, "optim/lr": 2.709015804661408e-05, "optim/total_tokens": 1940821901312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.303934097290039, "created_at": "2025-06-03T04:42:26.729969+00:00"} {"global_step": 231365, "acc_step": 0, "speed/wps": 5524.933341900051, "speed/FLOPS": 244173774539569.34, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04289672523736954, "optim/lr": 2.7086610821519532e-05, "optim/total_tokens": 1940830289920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2964414358139038, "created_at": "2025-06-03T04:42:29.703229+00:00"} {"global_step": 231366, "acc_step": 0, "speed/wps": 5519.595631118872, "speed/FLOPS": 243937875043921.72, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05181283876299858, "optim/lr": 2.7083063596425206e-05, "optim/total_tokens": 1940838678528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2983697652816772, "created_at": "2025-06-03T04:42:32.679770+00:00"} {"global_step": 231367, "acc_step": 0, "speed/wps": 5525.432311869127, "speed/FLOPS": 244195826458242.7, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042241934686899185, "optim/lr": 2.707951637133066e-05, "optim/total_tokens": 1940847067136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3047850131988525, "created_at": "2025-06-03T04:42:35.652683+00:00"} {"global_step": 231368, "acc_step": 0, "speed/wps": 5504.6609250062, "speed/FLOPS": 243277837476497.2, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.31 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.31, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.048799265176057816, "optim/lr": 2.7075969146236113e-05, "optim/total_tokens": 1940855455744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3072701692581177, "created_at": "2025-06-03T04:42:38.635847+00:00"} {"global_step": 231369, "acc_step": 0, "speed/wps": 5518.448238915665, "speed/FLOPS": 243887166181425.62, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042974043637514114, "optim/lr": 2.7072421921141567e-05, "optim/total_tokens": 1940863844352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3056342601776123, "created_at": "2025-06-03T04:42:41.608721+00:00"} {"global_step": 231370, "acc_step": 0, "speed/wps": 5536.823138735302, "speed/FLOPS": 244699242702190.34, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.050219953060150146, "optim/lr": 2.706887469604724e-05, "optim/total_tokens": 1940872232960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3082705736160278, "created_at": "2025-06-03T04:42:44.571594+00:00"} {"global_step": 231371, "acc_step": 0, "speed/wps": 5514.494265731872, "speed/FLOPS": 243712420804971.38, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.047893162816762924, "optim/lr": 2.7065327470952694e-05, "optim/total_tokens": 1940880621568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.282584309577942, "created_at": "2025-06-03T04:42:47.547322+00:00"} {"global_step": 231372, "acc_step": 0, "speed/wps": 5510.257002262358, "speed/FLOPS": 243525155447899.38, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 191.05, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05404849350452423, "optim/lr": 2.7061780245858148e-05, "optim/total_tokens": 1940889010176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2972978353500366, "created_at": "2025-06-03T04:42:50.523935+00:00"} {"global_step": 231373, "acc_step": 0, "speed/wps": 5529.804564317516, "speed/FLOPS": 244389057637244.72, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.045036617666482925, "optim/lr": 2.70582330207636e-05, "optim/total_tokens": 1940897398784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.316330909729004, "created_at": "2025-06-03T04:42:53.493730+00:00"} {"global_step": 231374, "acc_step": 0, "speed/wps": 5516.333480228644, "speed/FLOPS": 243793704671775.5, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04951418191194534, "optim/lr": 2.7054685795669275e-05, "optim/total_tokens": 1940905787392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2942157983779907, "created_at": "2025-06-03T04:42:56.469608+00:00"} {"global_step": 231375, "acc_step": 0, "speed/wps": 5522.63104042188, "speed/FLOPS": 244072024598481.44, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0425923615694046, "optim/lr": 2.705113857057473e-05, "optim/total_tokens": 1940914176000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2907273769378662, "created_at": "2025-06-03T04:42:59.440296+00:00"} {"global_step": 231376, "acc_step": 0, "speed/wps": 5514.354932935157, "speed/FLOPS": 243706263008526.5, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04520530626177788, "optim/lr": 2.7047591345480182e-05, "optim/total_tokens": 1940922564608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3000808954238892, "created_at": "2025-06-03T04:43:02.415689+00:00"} {"global_step": 231377, "acc_step": 0, "speed/wps": 5505.84304544904, "speed/FLOPS": 243330081149429.78, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04115011543035507, "optim/lr": 2.7044044120385636e-05, "optim/total_tokens": 1940930953216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3077435493469238, "created_at": "2025-06-03T04:43:05.394832+00:00"} {"global_step": 231378, "acc_step": 0, "speed/wps": 5523.707196997817, "speed/FLOPS": 244119585210869.12, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.045071590691804886, "optim/lr": 2.704049689529131e-05, "optim/total_tokens": 1940939341824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3009299039840698, "created_at": "2025-06-03T04:43:08.368219+00:00"} {"global_step": 231379, "acc_step": 0, "speed/wps": 5516.127545320971, "speed/FLOPS": 243784603402926.78, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04210245981812477, "optim/lr": 2.7036949670196763e-05, "optim/total_tokens": 1940947730432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3113263845443726, "created_at": "2025-06-03T04:43:11.346412+00:00"} {"global_step": 231380, "acc_step": 0, "speed/wps": 5512.007863618846, "speed/FLOPS": 243602534558135.38, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041979629546403885, "optim/lr": 2.7033402445102217e-05, "optim/total_tokens": 1940956119040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2837952375411987, "created_at": "2025-06-03T04:43:14.322307+00:00"} {"global_step": 231381, "acc_step": 0, "speed/wps": 5523.790089370447, "speed/FLOPS": 244123248629457.78, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04157029092311859, "optim/lr": 2.702985522000767e-05, "optim/total_tokens": 1940964507648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3141767978668213, "created_at": "2025-06-03T04:43:17.299216+00:00"} {"global_step": 231382, "acc_step": 0, "speed/wps": 5508.717173510861, "speed/FLOPS": 243457102898641.28, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0419587567448616, "optim/lr": 2.7026307994913345e-05, "optim/total_tokens": 1940972896256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2919498682022095, "created_at": "2025-06-03T04:43:20.281724+00:00"} {"global_step": 231383, "acc_step": 0, "speed/wps": 5511.613977843447, "speed/FLOPS": 243585126822952.88, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.29 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.29, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04233422130346298, "optim/lr": 2.7022760769818798e-05, "optim/total_tokens": 1940981284864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.300775170326233, "created_at": "2025-06-03T04:43:23.258241+00:00"} {"global_step": 231384, "acc_step": 0, "speed/wps": 5499.400087322498, "speed/FLOPS": 243045335378285.84, "speed/curr_iter_time": 2.9777, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9777, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.3 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.3, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04755505174398422, "optim/lr": 2.7019213544724252e-05, "optim/total_tokens": 1940989673472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2935569286346436, "created_at": "2025-06-03T04:43:26.245812+00:00"} {"global_step": 231385, "acc_step": 0, "speed/wps": 5515.581309557091, "speed/FLOPS": 243760462578051.38, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04162244126200676, "optim/lr": 2.7015666319629705e-05, "optim/total_tokens": 1940998062080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.30983567237854, "created_at": "2025-06-03T04:43:29.220893+00:00"} {"global_step": 231386, "acc_step": 0, "speed/wps": 5520.068224559202, "speed/FLOPS": 243958761255031.75, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04545014724135399, "optim/lr": 2.7012119094535383e-05, "optim/total_tokens": 1941006450688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2854633331298828, "created_at": "2025-06-03T04:43:32.196315+00:00"} {"global_step": 231387, "acc_step": 0, "speed/wps": 5527.132776644404, "speed/FLOPS": 244270978297542.16, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043853309005498886, "optim/lr": 2.7008571869440833e-05, "optim/total_tokens": 1941014839296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3000210523605347, "created_at": "2025-06-03T04:43:35.165026+00:00"} {"global_step": 231388, "acc_step": 0, "speed/wps": 5512.43993948021, "speed/FLOPS": 243621630099642.9, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.045842766761779785, "optim/lr": 2.7005024644346286e-05, "optim/total_tokens": 1941023227904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2996221780776978, "created_at": "2025-06-03T04:43:38.145536+00:00"} {"global_step": 231389, "acc_step": 0, "speed/wps": 5515.344281806163, "speed/FLOPS": 243749987164678.38, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04618668928742409, "optim/lr": 2.7001477419251964e-05, "optim/total_tokens": 1941031616512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2927114963531494, "created_at": "2025-06-03T04:43:41.119688+00:00"} {"global_step": 231390, "acc_step": 0, "speed/wps": 5515.762396860871, "speed/FLOPS": 243768465709989.62, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04370102286338806, "optim/lr": 2.6997930194157417e-05, "optim/total_tokens": 1941040005120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3089967966079712, "created_at": "2025-06-03T04:43:44.095607+00:00"} {"global_step": 231391, "acc_step": 0, "speed/wps": 5513.844473485922, "speed/FLOPS": 243683703313638.62, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04371741786599159, "optim/lr": 2.699438296906287e-05, "optim/total_tokens": 1941048393728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2983931303024292, "created_at": "2025-06-03T04:43:47.070785+00:00"} {"global_step": 231392, "acc_step": 0, "speed/wps": 5518.18056083733, "speed/FLOPS": 243875336180463.8, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.047679442912340164, "optim/lr": 2.6990835743968324e-05, "optim/total_tokens": 1941056782336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3071284294128418, "created_at": "2025-06-03T04:43:50.043389+00:00"} {"global_step": 231393, "acc_step": 0, "speed/wps": 5510.837476940601, "speed/FLOPS": 243550809457539.0, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 191.05, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04239920899271965, "optim/lr": 2.6987288518873998e-05, "optim/total_tokens": 1941065170944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2891489267349243, "created_at": "2025-06-03T04:43:53.024246+00:00"} {"global_step": 231394, "acc_step": 0, "speed/wps": 5515.246253613502, "speed/FLOPS": 243745654820316.53, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.046922262758016586, "optim/lr": 2.6983741293779452e-05, "optim/total_tokens": 1941073559552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2823154926300049, "created_at": "2025-06-03T04:43:56.002604+00:00"} {"global_step": 231395, "acc_step": 0, "speed/wps": 5519.765724347501, "speed/FLOPS": 243945392294011.06, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042363107204437256, "optim/lr": 2.6980194068684905e-05, "optim/total_tokens": 1941081948160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3099701404571533, "created_at": "2025-06-03T04:43:58.978914+00:00"} {"global_step": 231396, "acc_step": 0, "speed/wps": 5510.157855674944, "speed/FLOPS": 243520773676213.9, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05105724558234215, "optim/lr": 2.697664684359036e-05, "optim/total_tokens": 1941090336768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3032699823379517, "created_at": "2025-06-03T04:44:01.959482+00:00"} {"global_step": 231397, "acc_step": 0, "speed/wps": 5522.160542734021, "speed/FLOPS": 244051231008903.53, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0415872223675251, "optim/lr": 2.6973099618496033e-05, "optim/total_tokens": 1941098725376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2877086400985718, "created_at": "2025-06-03T04:44:04.931324+00:00"} {"global_step": 231398, "acc_step": 0, "speed/wps": 5524.850947883588, "speed/FLOPS": 244170133145772.47, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.051381394267082214, "optim/lr": 2.6969552393401487e-05, "optim/total_tokens": 1941107113984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2798305749893188, "created_at": "2025-06-03T04:44:07.904867+00:00"} {"global_step": 231399, "acc_step": 0, "speed/wps": 5518.569995406845, "speed/FLOPS": 243892547195129.6, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04315973073244095, "optim/lr": 2.696600516830694e-05, "optim/total_tokens": 1941115502592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.303306221961975, "created_at": "2025-06-03T04:44:10.881000+00:00"} {"global_step": 231400, "acc_step": 0, "speed/wps": 5509.036306407026, "speed/FLOPS": 243471206939181.53, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.054191503673791885, "optim/lr": 2.6962457943212394e-05, "optim/total_tokens": 1941123891200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2886155843734741, "created_at": "2025-06-03T04:44:13.858480+00:00"} {"global_step": 231401, "acc_step": 0, "speed/wps": 5507.15026819843, "speed/FLOPS": 243387853703980.25, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04483149200677872, "optim/lr": 2.6958910718118068e-05, "optim/total_tokens": 1941132279808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.306738018989563, "created_at": "2025-06-03T04:44:16.839121+00:00"} {"global_step": 231402, "acc_step": 0, "speed/wps": 5507.631497062306, "speed/FLOPS": 243409121556610.94, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.28 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.28, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.050947774201631546, "optim/lr": 2.695536349302352e-05, "optim/total_tokens": 1941140668416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3009512424468994, "created_at": "2025-06-03T04:44:19.821120+00:00"} {"global_step": 231403, "acc_step": 0, "speed/wps": 5518.887483919445, "speed/FLOPS": 243906578562332.97, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04398278519511223, "optim/lr": 2.6951816267928975e-05, "optim/total_tokens": 1941149057024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3098076581954956, "created_at": "2025-06-03T04:44:22.793921+00:00"} {"global_step": 231404, "acc_step": 0, "speed/wps": 5521.333228812324, "speed/FLOPS": 244014667968141.03, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04688697308301926, "optim/lr": 2.694826904283443e-05, "optim/total_tokens": 1941157445632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3042559623718262, "created_at": "2025-06-03T04:44:25.768059+00:00"} {"global_step": 231405, "acc_step": 0, "speed/wps": 5519.7982304704265, "speed/FLOPS": 243946828898262.94, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04478476569056511, "optim/lr": 2.6944721817740102e-05, "optim/total_tokens": 1941165834240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2988343238830566, "created_at": "2025-06-03T04:44:28.743846+00:00"} {"global_step": 231406, "acc_step": 0, "speed/wps": 5516.7328182412775, "speed/FLOPS": 243811353367936.7, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043283749371767044, "optim/lr": 2.6941174592645556e-05, "optim/total_tokens": 1941174222848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.306481957435608, "created_at": "2025-06-03T04:44:31.720174+00:00"} {"global_step": 231407, "acc_step": 0, "speed/wps": 5517.584507558227, "speed/FLOPS": 243848993676404.75, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.83, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04252000153064728, "optim/lr": 2.693762736755101e-05, "optim/total_tokens": 1941182611456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.294847846031189, "created_at": "2025-06-03T04:44:34.693140+00:00"} {"global_step": 231408, "acc_step": 0, "speed/wps": 5509.538522358261, "speed/FLOPS": 243493402313651.8, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 191.05, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04203306883573532, "optim/lr": 2.6934080142456463e-05, "optim/total_tokens": 1941191000064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3014496564865112, "created_at": "2025-06-03T04:44:37.673949+00:00"} {"global_step": 231409, "acc_step": 0, "speed/wps": 5514.403580295112, "speed/FLOPS": 243708412972836.75, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04172100871801376, "optim/lr": 2.6930532917362137e-05, "optim/total_tokens": 1941199388672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3015775680541992, "created_at": "2025-06-03T04:44:40.653677+00:00"} {"global_step": 231410, "acc_step": 0, "speed/wps": 5508.202914434471, "speed/FLOPS": 243434375279681.38, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.27 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.27, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.045866914093494415, "optim/lr": 2.692698569226759e-05, "optim/total_tokens": 1941207777280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2917287349700928, "created_at": "2025-06-03T04:44:43.633068+00:00"} {"global_step": 231411, "acc_step": 0, "speed/wps": 5517.194120251513, "speed/FLOPS": 243831740555631.34, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0440678596496582, "optim/lr": 2.6923438467173044e-05, "optim/total_tokens": 1941216165888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2934123277664185, "created_at": "2025-06-03T04:44:46.606323+00:00"} {"global_step": 231412, "acc_step": 0, "speed/wps": 5513.778063316012, "speed/FLOPS": 243680768324046.66, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04133716970682144, "optim/lr": 2.6919891242078498e-05, "optim/total_tokens": 1941224554496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2973233461380005, "created_at": "2025-06-03T04:44:49.581359+00:00"} {"global_step": 231413, "acc_step": 0, "speed/wps": 5517.3765489782545, "speed/FLOPS": 243839802971598.47, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04206908866763115, "optim/lr": 2.6916344016984175e-05, "optim/total_tokens": 1941232943104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3036346435546875, "created_at": "2025-06-03T04:44:52.559843+00:00"} {"global_step": 231414, "acc_step": 0, "speed/wps": 5522.383362247759, "speed/FLOPS": 244061078490917.06, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.25 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.25, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043610166758298874, "optim/lr": 2.6912796791889625e-05, "optim/total_tokens": 1941241331712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2923952341079712, "created_at": "2025-06-03T04:44:55.530454+00:00"} {"global_step": 231415, "acc_step": 0, "speed/wps": 5521.738442794699, "speed/FLOPS": 244032576352088.84, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.25 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.25, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04487896338105202, "optim/lr": 2.690924956679508e-05, "optim/total_tokens": 1941249720320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2879247665405273, "created_at": "2025-06-03T04:44:58.501272+00:00"} {"global_step": 231416, "acc_step": 0, "speed/wps": 5517.833966832634, "speed/FLOPS": 243860018499485.22, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.25 hours", "speed/est_time_elapsed_hrs": 190.82, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.25, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041670698672533035, "optim/lr": 2.6905702341700756e-05, "optim/total_tokens": 1941258108928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.299980878829956, "created_at": "2025-06-03T04:45:01.474915+00:00"} {"global_step": 231417, "acc_step": 0, "speed/wps": 5511.563475945774, "speed/FLOPS": 243582894897567.88, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04295619949698448, "optim/lr": 2.690215511660621e-05, "optim/total_tokens": 1941266497536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.286307692527771, "created_at": "2025-06-03T04:45:04.455182+00:00"} {"global_step": 231418, "acc_step": 0, "speed/wps": 5504.60115736789, "speed/FLOPS": 243275196052802.38, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 191.22, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04300067946314812, "optim/lr": 2.6898607891511663e-05, "optim/total_tokens": 1941274886144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.294800877571106, "created_at": "2025-06-03T04:45:07.437989+00:00"} {"global_step": 231419, "acc_step": 0, "speed/wps": 5510.1666192291605, "speed/FLOPS": 243521160980454.38, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04410463199019432, "optim/lr": 2.6895060666417113e-05, "optim/total_tokens": 1941283274752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.282923936843872, "created_at": "2025-06-03T04:45:10.419641+00:00"} {"global_step": 231420, "acc_step": 0, "speed/wps": 5518.400756560727, "speed/FLOPS": 243885067704374.12, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.25 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.25, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04920591413974762, "optim/lr": 2.689151344132279e-05, "optim/total_tokens": 1941291663360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3142712116241455, "created_at": "2025-06-03T04:45:13.392603+00:00"} {"global_step": 231421, "acc_step": 0, "speed/wps": 5521.776960640993, "speed/FLOPS": 244034278643742.8, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04348710551857948, "optim/lr": 2.6887966216228244e-05, "optim/total_tokens": 1941300051968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2924469709396362, "created_at": "2025-06-03T04:45:16.368809+00:00"} {"global_step": 231422, "acc_step": 0, "speed/wps": 5512.256919054587, "speed/FLOPS": 243613541533613.84, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.26 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.26, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043517932295799255, "optim/lr": 2.6884418991133698e-05, "optim/total_tokens": 1941308440576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.29770827293396, "created_at": "2025-06-03T04:45:19.346280+00:00"} {"global_step": 231423, "acc_step": 0, "speed/wps": 5522.082644501216, "speed/FLOPS": 244047788305732.84, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.044447146356105804, "optim/lr": 2.688087176603915e-05, "optim/total_tokens": 1941316829184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.300559639930725, "created_at": "2025-06-03T04:45:22.321904+00:00"} {"global_step": 231424, "acc_step": 0, "speed/wps": 5523.1495964406195, "speed/FLOPS": 244094942120299.38, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04146882891654968, "optim/lr": 2.6877324540944825e-05, "optim/total_tokens": 1941325217792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2707353830337524, "created_at": "2025-06-03T04:45:25.292749+00:00"} {"global_step": 231425, "acc_step": 0, "speed/wps": 5518.542330992043, "speed/FLOPS": 243891324569594.66, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043546825647354126, "optim/lr": 2.687377731585028e-05, "optim/total_tokens": 1941333606400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3090852499008179, "created_at": "2025-06-03T04:45:28.269892+00:00"} {"global_step": 231426, "acc_step": 0, "speed/wps": 5516.414051036848, "speed/FLOPS": 243797265489099.34, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.25 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.25, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04358314722776413, "optim/lr": 2.6870230090755732e-05, "optim/total_tokens": 1941341995008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2955657243728638, "created_at": "2025-06-03T04:45:31.245453+00:00"} {"global_step": 231427, "acc_step": 0, "speed/wps": 5513.569143076235, "speed/FLOPS": 243671535118799.25, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.25 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.25, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042173560708761215, "optim/lr": 2.6866682865661186e-05, "optim/total_tokens": 1941350383616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3088922500610352, "created_at": "2025-06-03T04:45:34.226388+00:00"} {"global_step": 231428, "acc_step": 0, "speed/wps": 5517.163888941873, "speed/FLOPS": 243830404486483.12, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04531659930944443, "optim/lr": 2.686313564056686e-05, "optim/total_tokens": 1941358772224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2989896535873413, "created_at": "2025-06-03T04:45:37.199980+00:00"} {"global_step": 231429, "acc_step": 0, "speed/wps": 5526.074001806387, "speed/FLOPS": 244224185869002.72, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04155011102557182, "optim/lr": 2.6859588415472314e-05, "optim/total_tokens": 1941367160832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2939702272415161, "created_at": "2025-06-03T04:45:40.168368+00:00"} {"global_step": 231430, "acc_step": 0, "speed/wps": 5527.845468067792, "speed/FLOPS": 244302475610570.56, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04472444951534271, "optim/lr": 2.6856041190377767e-05, "optim/total_tokens": 1941375549440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2979215383529663, "created_at": "2025-06-03T04:45:43.138879+00:00"} {"global_step": 231431, "acc_step": 0, "speed/wps": 5519.966801615257, "speed/FLOPS": 243954278880039.1, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04357612133026123, "optim/lr": 2.685249396528322e-05, "optim/total_tokens": 1941383938048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3066219091415405, "created_at": "2025-06-03T04:45:46.110668+00:00"} {"global_step": 231432, "acc_step": 0, "speed/wps": 5522.201676137495, "speed/FLOPS": 244053048894797.25, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04603634029626846, "optim/lr": 2.6848946740188895e-05, "optim/total_tokens": 1941392326656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2810733318328857, "created_at": "2025-06-03T04:45:49.080903+00:00"} {"global_step": 231433, "acc_step": 0, "speed/wps": 5529.625996537237, "speed/FLOPS": 244381165855349.16, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04694649949669838, "optim/lr": 2.6845399515094348e-05, "optim/total_tokens": 1941400715264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.282043218612671, "created_at": "2025-06-03T04:45:52.048001+00:00"} {"global_step": 231434, "acc_step": 0, "speed/wps": 5517.000564363558, "speed/FLOPS": 243823186376092.56, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04129219427704811, "optim/lr": 2.6841852289999802e-05, "optim/total_tokens": 1941409103872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2983086109161377, "created_at": "2025-06-03T04:45:55.023036+00:00"} {"global_step": 231435, "acc_step": 0, "speed/wps": 5505.799656398404, "speed/FLOPS": 243328163575476.97, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.25 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.25, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04450313374400139, "optim/lr": 2.6838305064905255e-05, "optim/total_tokens": 1941417492480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2821317911148071, "created_at": "2025-06-03T04:45:58.003981+00:00"} {"global_step": 231436, "acc_step": 0, "speed/wps": 5526.86683433664, "speed/FLOPS": 244259225008755.12, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04130068048834801, "optim/lr": 2.683475783981093e-05, "optim/total_tokens": 1941425881088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3027623891830444, "created_at": "2025-06-03T04:46:00.972126+00:00"} {"global_step": 231437, "acc_step": 0, "speed/wps": 5527.260296214871, "speed/FLOPS": 244276614009852.5, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04546790570020676, "optim/lr": 2.6831210614716383e-05, "optim/total_tokens": 1941434269696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.299513339996338, "created_at": "2025-06-03T04:46:03.944987+00:00"} {"global_step": 231438, "acc_step": 0, "speed/wps": 5508.783709795372, "speed/FLOPS": 243460043461853.06, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04323361814022064, "optim/lr": 2.6827663389621836e-05, "optim/total_tokens": 1941442658304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2881412506103516, "created_at": "2025-06-03T04:46:06.926056+00:00"} {"global_step": 231439, "acc_step": 0, "speed/wps": 5514.764650510014, "speed/FLOPS": 243724370428210.5, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.24 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.24, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04299679771065712, "optim/lr": 2.682411616452729e-05, "optim/total_tokens": 1941451046912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.31165611743927, "created_at": "2025-06-03T04:46:09.903444+00:00"} {"global_step": 231440, "acc_step": 0, "speed/wps": 5521.004387486089, "speed/FLOPS": 244000134864683.97, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04186549410223961, "optim/lr": 2.6820568939432964e-05, "optim/total_tokens": 1941459435520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2842004299163818, "created_at": "2025-06-03T04:46:12.874341+00:00"} {"global_step": 231441, "acc_step": 0, "speed/wps": 5516.690423815798, "speed/FLOPS": 243809479751324.8, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.047107383608818054, "optim/lr": 2.6817021714338417e-05, "optim/total_tokens": 1941467824128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2984570264816284, "created_at": "2025-06-03T04:46:15.847492+00:00"} {"global_step": 231442, "acc_step": 0, "speed/wps": 5517.318595172505, "speed/FLOPS": 243837241710018.8, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04155867546796799, "optim/lr": 2.681347448924387e-05, "optim/total_tokens": 1941476212736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3023614883422852, "created_at": "2025-06-03T04:46:18.822459+00:00"} {"global_step": 231443, "acc_step": 0, "speed/wps": 5524.613197371907, "speed/FLOPS": 244159625790073.6, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04409864544868469, "optim/lr": 2.6809927264149548e-05, "optim/total_tokens": 1941484601344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2902190685272217, "created_at": "2025-06-03T04:46:21.791674+00:00"} {"global_step": 231444, "acc_step": 0, "speed/wps": 5524.619401083205, "speed/FLOPS": 244159899962359.53, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042285382747650146, "optim/lr": 2.6806380039055002e-05, "optim/total_tokens": 1941492989952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2991664409637451, "created_at": "2025-06-03T04:46:24.760824+00:00"} {"global_step": 231445, "acc_step": 0, "speed/wps": 5531.531800285707, "speed/FLOPS": 244465392626243.62, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.21 hours", "speed/est_time_elapsed_hrs": 190.31, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.21, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04373016580939293, "optim/lr": 2.6802832813960456e-05, "optim/total_tokens": 1941501378560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2956422567367554, "created_at": "2025-06-03T04:46:27.726897+00:00"} {"global_step": 231446, "acc_step": 0, "speed/wps": 5528.5983298092515, "speed/FLOPS": 244335748246047.3, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04173329100012779, "optim/lr": 2.6799285588865906e-05, "optim/total_tokens": 1941509767168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2901467084884644, "created_at": "2025-06-03T04:46:30.697223+00:00"} {"global_step": 231447, "acc_step": 0, "speed/wps": 5517.962984454946, "speed/FLOPS": 243865720418019.38, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04272821173071861, "optim/lr": 2.6795738363771583e-05, "optim/total_tokens": 1941518155776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3086574077606201, "created_at": "2025-06-03T04:46:33.670056+00:00"} {"global_step": 231448, "acc_step": 0, "speed/wps": 5518.908561377166, "speed/FLOPS": 243907510078080.03, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04449804127216339, "optim/lr": 2.6792191138677037e-05, "optim/total_tokens": 1941526544384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2979471683502197, "created_at": "2025-06-03T04:46:36.645674+00:00"} {"global_step": 231449, "acc_step": 0, "speed/wps": 5515.340767369482, "speed/FLOPS": 243749831844565.6, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04184776172041893, "optim/lr": 2.678864391358249e-05, "optim/total_tokens": 1941534932992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2956234216690063, "created_at": "2025-06-03T04:46:39.622351+00:00"} {"global_step": 231450, "acc_step": 0, "speed/wps": 5522.498000876277, "speed/FLOPS": 244066144931523.88, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04544853791594505, "optim/lr": 2.6785096688487944e-05, "optim/total_tokens": 1941543321600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2959800958633423, "created_at": "2025-06-03T04:46:42.593210+00:00"} {"global_step": 231451, "acc_step": 0, "speed/wps": 5516.766527773728, "speed/FLOPS": 243812843156729.97, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041902512311935425, "optim/lr": 2.6781549463393618e-05, "optim/total_tokens": 1941551710208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3178523778915405, "created_at": "2025-06-03T04:46:45.569295+00:00"} {"global_step": 231452, "acc_step": 0, "speed/wps": 5514.991052741813, "speed/FLOPS": 243734376248024.38, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.23 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.23, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043945666402578354, "optim/lr": 2.677800223829907e-05, "optim/total_tokens": 1941560098816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3012094497680664, "created_at": "2025-06-03T04:46:48.544172+00:00"} {"global_step": 231453, "acc_step": 0, "speed/wps": 5521.0363368444805, "speed/FLOPS": 244001546862793.22, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042859289795160294, "optim/lr": 2.6774455013204525e-05, "optim/total_tokens": 1941568487424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2933356761932373, "created_at": "2025-06-03T04:46:51.515318+00:00"} {"global_step": 231454, "acc_step": 0, "speed/wps": 5534.795876696156, "speed/FLOPS": 244609648096527.84, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04229816794395447, "optim/lr": 2.677090778810998e-05, "optim/total_tokens": 1941576876032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2910313606262207, "created_at": "2025-06-03T04:46:54.480373+00:00"} {"global_step": 231455, "acc_step": 0, "speed/wps": 5537.406985528669, "speed/FLOPS": 244725045742058.38, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.13, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04337678477168083, "optim/lr": 2.6767360563015652e-05, "optim/total_tokens": 1941585264640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2978392839431763, "created_at": "2025-06-03T04:46:57.443090+00:00"} {"global_step": 231456, "acc_step": 0, "speed/wps": 5532.778223889, "speed/FLOPS": 244520478169734.84, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04462975263595581, "optim/lr": 2.6763813337921106e-05, "optim/total_tokens": 1941593653248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.307831048965454, "created_at": "2025-06-03T04:47:00.414261+00:00"} {"global_step": 231457, "acc_step": 0, "speed/wps": 5523.750926855477, "speed/FLOPS": 244121517846748.0, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.21 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.21, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.044036250561475754, "optim/lr": 2.676026611282656e-05, "optim/total_tokens": 1941602041856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3076720237731934, "created_at": "2025-06-03T04:47:03.386900+00:00"} {"global_step": 231458, "acc_step": 0, "speed/wps": 5530.273141055638, "speed/FLOPS": 244409766330676.53, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04153139889240265, "optim/lr": 2.6756718887732013e-05, "optim/total_tokens": 1941610430464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2958427667617798, "created_at": "2025-06-03T04:47:06.357587+00:00"} {"global_step": 231459, "acc_step": 0, "speed/wps": 5525.902636082874, "speed/FLOPS": 244216612381152.72, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.21 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.21, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.044383831322193146, "optim/lr": 2.6753171662637687e-05, "optim/total_tokens": 1941618819072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2922710180282593, "created_at": "2025-06-03T04:47:09.326140+00:00"} {"global_step": 231460, "acc_step": 0, "speed/wps": 5525.188884172014, "speed/FLOPS": 244185068200006.2, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.21 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.21, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04211244732141495, "optim/lr": 2.674962443754314e-05, "optim/total_tokens": 1941627207680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2978284358978271, "created_at": "2025-06-03T04:47:12.300112+00:00"} {"global_step": 231461, "acc_step": 0, "speed/wps": 5517.328932358926, "speed/FLOPS": 243837698560748.1, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.22 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.22, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041768573224544525, "optim/lr": 2.6746077212448594e-05, "optim/total_tokens": 1941635596288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2846193313598633, "created_at": "2025-06-03T04:47:15.273539+00:00"} {"global_step": 231462, "acc_step": 0, "speed/wps": 5536.772022204805, "speed/FLOPS": 244696983613180.5, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.15, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041006941348314285, "optim/lr": 2.6742529987354048e-05, "optim/total_tokens": 1941643984896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2835875749588013, "created_at": "2025-06-03T04:47:18.236678+00:00"} {"global_step": 231463, "acc_step": 0, "speed/wps": 5527.9841593744595, "speed/FLOPS": 244308605056438.78, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04177405312657356, "optim/lr": 2.673898276225972e-05, "optim/total_tokens": 1941652373504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.292220115661621, "created_at": "2025-06-03T04:47:21.208080+00:00"} {"global_step": 231464, "acc_step": 0, "speed/wps": 5532.979121827983, "speed/FLOPS": 244529356830349.03, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.34, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04135159030556679, "optim/lr": 2.6735435537165175e-05, "optim/total_tokens": 1941660762112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2852219343185425, "created_at": "2025-06-03T04:47:24.177454+00:00"} {"global_step": 231465, "acc_step": 0, "speed/wps": 5527.240629713634, "speed/FLOPS": 244275744851160.1, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.47, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04239262267947197, "optim/lr": 2.673188831207063e-05, "optim/total_tokens": 1941669150720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2778915166854858, "created_at": "2025-06-03T04:47:27.147531+00:00"} {"global_step": 231466, "acc_step": 0, "speed/wps": 5516.340915100259, "speed/FLOPS": 243794033255045.78, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.21 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.21, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04250945523381233, "optim/lr": 2.6728341086976082e-05, "optim/total_tokens": 1941677539328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2954678535461426, "created_at": "2025-06-03T04:47:30.126355+00:00"} {"global_step": 231467, "acc_step": 0, "speed/wps": 5534.585893070938, "speed/FLOPS": 244600367895086.88, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04091857373714447, "optim/lr": 2.6724793861881756e-05, "optim/total_tokens": 1941685927936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.29239022731781, "created_at": "2025-06-03T04:47:33.093651+00:00"} {"global_step": 231468, "acc_step": 0, "speed/wps": 5525.7443490875285, "speed/FLOPS": 244209616906144.75, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.59, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04062140733003616, "optim/lr": 2.672124663678721e-05, "optim/total_tokens": 1941694316544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2933963537216187, "created_at": "2025-06-03T04:47:36.063065+00:00"} {"global_step": 231469, "acc_step": 0, "speed/wps": 5525.872944972805, "speed/FLOPS": 244215300186060.56, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05117632821202278, "optim/lr": 2.6717699411692663e-05, "optim/total_tokens": 1941702705152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3048771619796753, "created_at": "2025-06-03T04:47:39.032951+00:00"} {"global_step": 231470, "acc_step": 0, "speed/wps": 5532.730275806109, "speed/FLOPS": 244518359109891.6, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04115128144621849, "optim/lr": 2.671415218659834e-05, "optim/total_tokens": 1941711093760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2875115871429443, "created_at": "2025-06-03T04:47:41.997972+00:00"} {"global_step": 231471, "acc_step": 0, "speed/wps": 5525.817777539178, "speed/FLOPS": 244212862067866.75, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04268737509846687, "optim/lr": 2.6710604961503794e-05, "optim/total_tokens": 1941719482368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3045759201049805, "created_at": "2025-06-03T04:47:44.967941+00:00"} {"global_step": 231472, "acc_step": 0, "speed/wps": 5530.954254996144, "speed/FLOPS": 244439868080589.72, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04161609336733818, "optim/lr": 2.6707057736409244e-05, "optim/total_tokens": 1941727870976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2950782775878906, "created_at": "2025-06-03T04:47:47.933819+00:00"} {"global_step": 231473, "acc_step": 0, "speed/wps": 5533.96170195208, "speed/FLOPS": 244572781842533.12, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.32, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04433608427643776, "optim/lr": 2.6703510511314698e-05, "optim/total_tokens": 1941736259584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2999199628829956, "created_at": "2025-06-03T04:47:50.903140+00:00"} {"global_step": 231474, "acc_step": 0, "speed/wps": 5526.466795251186, "speed/FLOPS": 244241545328763.75, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04356628656387329, "optim/lr": 2.6699963286220375e-05, "optim/total_tokens": 1941744648192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.3019788265228271, "created_at": "2025-06-03T04:47:53.873023+00:00"} {"global_step": 231475, "acc_step": 0, "speed/wps": 5522.93788346094, "speed/FLOPS": 244085585490242.8, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04137874394655228, "optim/lr": 2.669641606112583e-05, "optim/total_tokens": 1941753036800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2928639650344849, "created_at": "2025-06-03T04:47:56.844684+00:00"} {"global_step": 231476, "acc_step": 0, "speed/wps": 5522.500028333552, "speed/FLOPS": 244066234534757.97, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04262335225939751, "optim/lr": 2.6692868836031282e-05, "optim/total_tokens": 1941761425408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2892067432403564, "created_at": "2025-06-03T04:47:59.815259+00:00"} {"global_step": 231477, "acc_step": 0, "speed/wps": 5520.794658098174, "speed/FLOPS": 243990865899230.44, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04229065403342247, "optim/lr": 2.6689321610936733e-05, "optim/total_tokens": 1941769814016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3061681985855103, "created_at": "2025-06-03T04:48:02.786951+00:00"} {"global_step": 231478, "acc_step": 0, "speed/wps": 5519.866762335501, "speed/FLOPS": 243949857655921.34, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04188059642910957, "optim/lr": 2.668577438584241e-05, "optim/total_tokens": 1941778202624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.312197208404541, "created_at": "2025-06-03T04:48:05.763744+00:00"} {"global_step": 231479, "acc_step": 0, "speed/wps": 5506.779756983236, "speed/FLOPS": 243371479004717.0, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.21 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.21, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04246033355593681, "optim/lr": 2.6682227160747864e-05, "optim/total_tokens": 1941786591232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3068437576293945, "created_at": "2025-06-03T04:48:08.747368+00:00"} {"global_step": 231480, "acc_step": 0, "speed/wps": 5520.1405144865475, "speed/FLOPS": 243961956099807.06, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04185212031006813, "optim/lr": 2.6678679935653317e-05, "optim/total_tokens": 1941794979840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2936650514602661, "created_at": "2025-06-03T04:48:11.721816+00:00"} {"global_step": 231481, "acc_step": 0, "speed/wps": 5530.377265805862, "speed/FLOPS": 244414368111677.7, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.44, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04210079461336136, "optim/lr": 2.667513271055877e-05, "optim/total_tokens": 1941803368448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3172752857208252, "created_at": "2025-06-03T04:48:14.688645+00:00"} {"global_step": 231482, "acc_step": 0, "speed/wps": 5524.122747936452, "speed/FLOPS": 244137950435374.25, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041393574327230453, "optim/lr": 2.6671585485464445e-05, "optim/total_tokens": 1941811757056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2964210510253906, "created_at": "2025-06-03T04:48:17.659205+00:00"} {"global_step": 231483, "acc_step": 0, "speed/wps": 5518.075302915121, "speed/FLOPS": 243870684319061.1, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04205505922436714, "optim/lr": 2.6668038260369898e-05, "optim/total_tokens": 1941820145664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.294180989265442, "created_at": "2025-06-03T04:48:20.632308+00:00"} {"global_step": 231484, "acc_step": 0, "speed/wps": 5516.631833537282, "speed/FLOPS": 243806890360906.62, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04283538833260536, "optim/lr": 2.6664491035275352e-05, "optim/total_tokens": 1941828534272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2932878732681274, "created_at": "2025-06-03T04:48:23.606453+00:00"} {"global_step": 231485, "acc_step": 0, "speed/wps": 5507.667515529998, "speed/FLOPS": 243410713388523.72, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.21 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.21, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041085418313741684, "optim/lr": 2.6660943810180805e-05, "optim/total_tokens": 1941836922880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3100144863128662, "created_at": "2025-06-03T04:48:26.585953+00:00"} {"global_step": 231486, "acc_step": 0, "speed/wps": 5516.613368773077, "speed/FLOPS": 243806074312840.03, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04245198145508766, "optim/lr": 2.665739658508648e-05, "optim/total_tokens": 1941845311488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2942005395889282, "created_at": "2025-06-03T04:48:29.559770+00:00"} {"global_step": 231487, "acc_step": 0, "speed/wps": 5528.696319788989, "speed/FLOPS": 244340078901593.53, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0430317297577858, "optim/lr": 2.6653849359991933e-05, "optim/total_tokens": 1941853700096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2906954288482666, "created_at": "2025-06-03T04:48:32.527782+00:00"} {"global_step": 231488, "acc_step": 0, "speed/wps": 5522.849803896754, "speed/FLOPS": 244081692824337.84, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04366731271147728, "optim/lr": 2.6650302134897386e-05, "optim/total_tokens": 1941862088704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2987558841705322, "created_at": "2025-06-03T04:48:35.498111+00:00"} {"global_step": 231489, "acc_step": 0, "speed/wps": 5526.566276139613, "speed/FLOPS": 244245941874842.88, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04421273618936539, "optim/lr": 2.664675490980284e-05, "optim/total_tokens": 1941870477312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2904707193374634, "created_at": "2025-06-03T04:48:38.468627+00:00"} {"global_step": 231490, "acc_step": 0, "speed/wps": 5521.814010587281, "speed/FLOPS": 244035916061729.94, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.047903478145599365, "optim/lr": 2.6643207684708514e-05, "optim/total_tokens": 1941878865920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.297226905822754, "created_at": "2025-06-03T04:48:41.440261+00:00"} {"global_step": 231491, "acc_step": 0, "speed/wps": 5511.496344122382, "speed/FLOPS": 243579928014585.75, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.2 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.2, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04279316961765289, "optim/lr": 2.6639660459613968e-05, "optim/total_tokens": 1941887254528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3078190088272095, "created_at": "2025-06-03T04:48:44.420796+00:00"} {"global_step": 231492, "acc_step": 0, "speed/wps": 5531.008072574811, "speed/FLOPS": 244442246542103.47, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04268583282828331, "optim/lr": 2.663611323451942e-05, "optim/total_tokens": 1941895643136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2951076030731201, "created_at": "2025-06-03T04:48:47.389997+00:00"} {"global_step": 231493, "acc_step": 0, "speed/wps": 5521.064809887849, "speed/FLOPS": 244002805225571.84, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04247744753956795, "optim/lr": 2.6632566009424875e-05, "optim/total_tokens": 1941904031744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2974371910095215, "created_at": "2025-06-03T04:48:50.362488+00:00"} {"global_step": 231494, "acc_step": 0, "speed/wps": 5516.438118603873, "speed/FLOPS": 243798329152372.88, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04252683371305466, "optim/lr": 2.662901878433055e-05, "optim/total_tokens": 1941912420352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2958422899246216, "created_at": "2025-06-03T04:48:53.340588+00:00"} {"global_step": 231495, "acc_step": 0, "speed/wps": 5520.9284563426745, "speed/FLOPS": 243996779096795.84, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04121953621506691, "optim/lr": 2.6625471559236002e-05, "optim/total_tokens": 1941920808960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2907741069793701, "created_at": "2025-06-03T04:48:56.311919+00:00"} {"global_step": 231496, "acc_step": 0, "speed/wps": 5525.040008160252, "speed/FLOPS": 244178488642302.8, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04206782206892967, "optim/lr": 2.6621924334141456e-05, "optim/total_tokens": 1941929197568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2996293306350708, "created_at": "2025-06-03T04:48:59.281332+00:00"} {"global_step": 231497, "acc_step": 0, "speed/wps": 5532.831736778764, "speed/FLOPS": 244522843165558.62, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04154573008418083, "optim/lr": 2.6618377109047133e-05, "optim/total_tokens": 1941937586176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.289318323135376, "created_at": "2025-06-03T04:49:02.249169+00:00"} {"global_step": 231498, "acc_step": 0, "speed/wps": 5407.412228292068, "speed/FLOPS": 238979942845685.72, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.043767184019088745, "optim/lr": 2.6614829883952583e-05, "optim/total_tokens": 1941945974784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2770599126815796, "created_at": "2025-06-03T04:49:05.287602+00:00"} {"global_step": 231499, "acc_step": 0, "speed/wps": 5528.103986252471, "speed/FLOPS": 244313900791117.34, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04216466099023819, "optim/lr": 2.6611282658858037e-05, "optim/total_tokens": 1941954363392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2962446212768555, "created_at": "2025-06-03T04:49:08.259020+00:00"} {"global_step": 231500, "acc_step": 0, "speed/wps": 5521.0552561746335, "speed/FLOPS": 244002383000348.06, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04432769492268562, "optim/lr": 2.660773543376349e-05, "optim/total_tokens": 1941962752000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2922030687332153, "created_at": "2025-06-03T04:49:11.236341+00:00"} {"global_step": 231501, "acc_step": 0, "speed/wps": 5520.1134440272945, "speed/FLOPS": 243960759724067.25, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04151982069015503, "optim/lr": 2.6604188208669168e-05, "optim/total_tokens": 1941971140608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2753809690475464, "created_at": "2025-06-03T04:49:14.214641+00:00"} {"global_step": 231502, "acc_step": 0, "speed/wps": 5515.095968697641, "speed/FLOPS": 243739012996263.4, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.19 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.19, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04718595743179321, "optim/lr": 2.660064098357462e-05, "optim/total_tokens": 1941979529216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.305457592010498, "created_at": "2025-06-03T04:49:17.191020+00:00"} {"global_step": 231503, "acc_step": 0, "speed/wps": 5526.163286111477, "speed/FLOPS": 244228131778289.2, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0490473248064518, "optim/lr": 2.6597093758480075e-05, "optim/total_tokens": 1941987917824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.292090892791748, "created_at": "2025-06-03T04:49:20.160499+00:00"} {"global_step": 231504, "acc_step": 0, "speed/wps": 5540.368986867725, "speed/FLOPS": 244855951040347.44, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 190.12, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0431290939450264, "optim/lr": 2.6593546533385525e-05, "optim/total_tokens": 1941996306432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3074419498443604, "created_at": "2025-06-03T04:49:23.123842+00:00"} {"global_step": 231505, "acc_step": 0, "speed/wps": 5526.414186642988, "speed/FLOPS": 244239220297556.66, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042295072227716446, "optim/lr": 2.6589999308291202e-05, "optim/total_tokens": 1942004695040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3065478801727295, "created_at": "2025-06-03T04:49:26.092761+00:00"} {"global_step": 231506, "acc_step": 0, "speed/wps": 5525.603263996119, "speed/FLOPS": 244203381667243.4, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04165661334991455, "optim/lr": 2.6586452083196656e-05, "optim/total_tokens": 1942013083648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.307018756866455, "created_at": "2025-06-03T04:49:29.066906+00:00"} {"global_step": 231507, "acc_step": 0, "speed/wps": 5523.567895997021, "speed/FLOPS": 244113428819641.12, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.7, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042561888694763184, "optim/lr": 2.658290485810211e-05, "optim/total_tokens": 1942021472256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2980784177780151, "created_at": "2025-06-03T04:49:32.037064+00:00"} {"global_step": 231508, "acc_step": 0, "speed/wps": 5520.588254412883, "speed/FLOPS": 243981743912810.38, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.047998663038015366, "optim/lr": 2.6579357633007563e-05, "optim/total_tokens": 1942029860864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3153717517852783, "created_at": "2025-06-03T04:49:35.009200+00:00"} {"global_step": 231509, "acc_step": 0, "speed/wps": 5518.979415468614, "speed/FLOPS": 243910641466257.94, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.18 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.18, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041824229061603546, "optim/lr": 2.6575810407913237e-05, "optim/total_tokens": 1942038249472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2814147472381592, "created_at": "2025-06-03T04:49:37.985417+00:00"} {"global_step": 231510, "acc_step": 0, "speed/wps": 5520.597627637915, "speed/FLOPS": 243982158161380.3, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04933615401387215, "optim/lr": 2.657226318281869e-05, "optim/total_tokens": 1942046638080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2872973680496216, "created_at": "2025-06-03T04:49:40.958724+00:00"} {"global_step": 231511, "acc_step": 0, "speed/wps": 5520.53271604401, "speed/FLOPS": 243979289401177.34, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04366143420338631, "optim/lr": 2.6568715957724144e-05, "optim/total_tokens": 1942055026688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2830901145935059, "created_at": "2025-06-03T04:49:43.931621+00:00"} {"global_step": 231512, "acc_step": 0, "speed/wps": 5528.813946927697, "speed/FLOPS": 244345277419054.16, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.062124837189912796, "optim/lr": 2.6565168732629598e-05, "optim/total_tokens": 1942063415296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2837146520614624, "created_at": "2025-06-03T04:49:46.899525+00:00"} {"global_step": 231513, "acc_step": 0, "speed/wps": 5518.315951270923, "speed/FLOPS": 243881319744637.56, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04978613555431366, "optim/lr": 2.656162150753527e-05, "optim/total_tokens": 1942071803904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2969496250152588, "created_at": "2025-06-03T04:49:49.877635+00:00"} {"global_step": 231514, "acc_step": 0, "speed/wps": 5528.673557719462, "speed/FLOPS": 244339072934627.28, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0532008521258831, "optim/lr": 2.6558074282440725e-05, "optim/total_tokens": 1942080192512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2893986701965332, "created_at": "2025-06-03T04:49:52.849103+00:00"} {"global_step": 231515, "acc_step": 0, "speed/wps": 5522.449380487012, "speed/FLOPS": 244063996159180.06, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05305718258023262, "optim/lr": 2.655452705734618e-05, "optim/total_tokens": 1942088581120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2902392148971558, "created_at": "2025-06-03T04:49:55.824500+00:00"} {"global_step": 231516, "acc_step": 0, "speed/wps": 5515.503765431078, "speed/FLOPS": 243757035524588.44, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04430411756038666, "optim/lr": 2.6550979832251632e-05, "optim/total_tokens": 1942096969728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.303666114807129, "created_at": "2025-06-03T04:49:58.801078+00:00"} {"global_step": 231517, "acc_step": 0, "speed/wps": 5524.5763969809705, "speed/FLOPS": 244157999401155.7, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05010572820901871, "optim/lr": 2.6547432607157306e-05, "optim/total_tokens": 1942105358336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.291601300239563, "created_at": "2025-06-03T04:50:01.770974+00:00"} {"global_step": 231518, "acc_step": 0, "speed/wps": 5515.020575160006, "speed/FLOPS": 243735680987799.06, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042410362511873245, "optim/lr": 2.654388538206276e-05, "optim/total_tokens": 1942113746944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2931277751922607, "created_at": "2025-06-03T04:50:04.749372+00:00"} {"global_step": 231519, "acc_step": 0, "speed/wps": 5528.465122052531, "speed/FLOPS": 244329861145019.4, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04932379722595215, "optim/lr": 2.6540338156968213e-05, "optim/total_tokens": 1942122135552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2952373027801514, "created_at": "2025-06-03T04:50:07.716928+00:00"} {"global_step": 231520, "acc_step": 0, "speed/wps": 5514.7296649956315, "speed/FLOPS": 243722824247546.9, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04212837293744087, "optim/lr": 2.6536790931873667e-05, "optim/total_tokens": 1942130524160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2961174249649048, "created_at": "2025-06-03T04:50:10.692433+00:00"} {"global_step": 231521, "acc_step": 0, "speed/wps": 5533.684029429064, "speed/FLOPS": 244560510138272.62, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.3, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04962386563420296, "optim/lr": 2.653324370677934e-05, "optim/total_tokens": 1942138912768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2901828289031982, "created_at": "2025-06-03T04:50:13.659172+00:00"} {"global_step": 231522, "acc_step": 0, "speed/wps": 5533.486012194839, "speed/FLOPS": 244551758790063.94, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04287218302488327, "optim/lr": 2.6529696481684794e-05, "optim/total_tokens": 1942147301376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2985111474990845, "created_at": "2025-06-03T04:50:16.628226+00:00"} {"global_step": 231523, "acc_step": 0, "speed/wps": 5525.9608493412425, "speed/FLOPS": 244219185109210.16, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0464387983083725, "optim/lr": 2.6526149256590248e-05, "optim/total_tokens": 1942155689984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2899770736694336, "created_at": "2025-06-03T04:50:19.600995+00:00"} {"global_step": 231524, "acc_step": 0, "speed/wps": 5534.160990171233, "speed/FLOPS": 244581589361770.1, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.35, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.046130307018756866, "optim/lr": 2.6522602031495702e-05, "optim/total_tokens": 1942164078592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3061689138412476, "created_at": "2025-06-03T04:50:22.567866+00:00"} {"global_step": 231525, "acc_step": 0, "speed/wps": 5511.855415137496, "speed/FLOPS": 243595797115561.72, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04338187351822853, "optim/lr": 2.6519054806401376e-05, "optim/total_tokens": 1942172467200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2859693765640259, "created_at": "2025-06-03T04:50:25.545061+00:00"} {"global_step": 231526, "acc_step": 0, "speed/wps": 5509.136483574107, "speed/FLOPS": 243475634257213.28, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04249194636940956, "optim/lr": 2.651550758130683e-05, "optim/total_tokens": 1942180855808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2937332391738892, "created_at": "2025-06-03T04:50:28.529584+00:00"} {"global_step": 231527, "acc_step": 0, "speed/wps": 5514.4959731454965, "speed/FLOPS": 243712496263914.25, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0472397617995739, "optim/lr": 2.6511960356212283e-05, "optim/total_tokens": 1942189244416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3081327676773071, "created_at": "2025-06-03T04:50:31.504329+00:00"} {"global_step": 231528, "acc_step": 0, "speed/wps": 5513.875646158177, "speed/FLOPS": 243685080986196.1, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.052035924047231674, "optim/lr": 2.650841313111796e-05, "optim/total_tokens": 1942197633024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3022007942199707, "created_at": "2025-06-03T04:50:34.481956+00:00"} {"global_step": 231529, "acc_step": 0, "speed/wps": 5508.924845109498, "speed/FLOPS": 243466280920341.4, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042080264538526535, "optim/lr": 2.6504865906023414e-05, "optim/total_tokens": 1942206021632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.308319330215454, "created_at": "2025-06-03T04:50:37.460869+00:00"} {"global_step": 231530, "acc_step": 0, "speed/wps": 5528.642517651155, "speed/FLOPS": 244337701122485.56, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042208969593048096, "optim/lr": 2.6501318680928864e-05, "optim/total_tokens": 1942214410240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2942427396774292, "created_at": "2025-06-03T04:50:40.428613+00:00"} {"global_step": 231531, "acc_step": 0, "speed/wps": 5519.88494622347, "speed/FLOPS": 243950661290696.0, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04480871558189392, "optim/lr": 2.6497771455834317e-05, "optim/total_tokens": 1942222798848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2996753454208374, "created_at": "2025-06-03T04:50:43.403763+00:00"} {"global_step": 231532, "acc_step": 0, "speed/wps": 5524.233707502148, "speed/FLOPS": 244142854280235.5, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.63, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042920004576444626, "optim/lr": 2.6494224230739995e-05, "optim/total_tokens": 1942231187456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2929128408432007, "created_at": "2025-06-03T04:50:46.373939+00:00"} {"global_step": 231533, "acc_step": 0, "speed/wps": 5523.492121509772, "speed/FLOPS": 244110079975153.7, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04325776919722557, "optim/lr": 2.6490677005645448e-05, "optim/total_tokens": 1942239576064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3167667388916016, "created_at": "2025-06-03T04:50:49.344184+00:00"} {"global_step": 231534, "acc_step": 0, "speed/wps": 5514.4332208795995, "speed/FLOPS": 243709722934956.8, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.044120579957962036, "optim/lr": 2.6487129780550902e-05, "optim/total_tokens": 1942247964672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3097795248031616, "created_at": "2025-06-03T04:50:52.319474+00:00"} {"global_step": 231535, "acc_step": 0, "speed/wps": 5510.814972167811, "speed/FLOPS": 243549814861771.53, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042298659682273865, "optim/lr": 2.6483582555456352e-05, "optim/total_tokens": 1942256353280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2996397018432617, "created_at": "2025-06-03T04:50:55.297332+00:00"} {"global_step": 231536, "acc_step": 0, "speed/wps": 5508.247445594247, "speed/FLOPS": 243436343329012.38, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.17 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.17, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04477490484714508, "optim/lr": 2.648003533036203e-05, "optim/total_tokens": 1942264741888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3110162019729614, "created_at": "2025-06-03T04:50:58.280353+00:00"} {"global_step": 231537, "acc_step": 0, "speed/wps": 5513.731806166713, "speed/FLOPS": 243678723994813.2, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042590584605932236, "optim/lr": 2.6476488105267483e-05, "optim/total_tokens": 1942273130496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.307615041732788, "created_at": "2025-06-03T04:51:01.256241+00:00"} {"global_step": 231538, "acc_step": 0, "speed/wps": 5523.431012986306, "speed/FLOPS": 244107379291198.28, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.14 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.14, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.06217775121331215, "optim/lr": 2.6472940880172936e-05, "optim/total_tokens": 1942281519104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3023525476455688, "created_at": "2025-06-03T04:51:04.230558+00:00"} {"global_step": 231539, "acc_step": 0, "speed/wps": 5513.635579318472, "speed/FLOPS": 243674471260654.6, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.16 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.16, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04267667233943939, "optim/lr": 2.646939365507839e-05, "optim/total_tokens": 1942289907712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2966376543045044, "created_at": "2025-06-03T04:51:07.210595+00:00"} {"global_step": 231540, "acc_step": 0, "speed/wps": 5518.886193635914, "speed/FLOPS": 243906521538405.2, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04739529639482498, "optim/lr": 2.6465846429984064e-05, "optim/total_tokens": 1942298296320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.296202301979065, "created_at": "2025-06-03T04:51:10.183715+00:00"} {"global_step": 231541, "acc_step": 0, "speed/wps": 5530.200778032677, "speed/FLOPS": 244406568255449.2, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.14 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.14, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0423479862511158, "optim/lr": 2.6462299204889518e-05, "optim/total_tokens": 1942306684928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2846523523330688, "created_at": "2025-06-03T04:51:13.156375+00:00"} {"global_step": 231542, "acc_step": 0, "speed/wps": 5512.57066555581, "speed/FLOPS": 243627407523067.7, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.05230068415403366, "optim/lr": 2.645875197979497e-05, "optim/total_tokens": 1942315073536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2974375486373901, "created_at": "2025-06-03T04:51:16.132506+00:00"} {"global_step": 231543, "acc_step": 0, "speed/wps": 5520.212317400888, "speed/FLOPS": 243965129421100.28, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04249592870473862, "optim/lr": 2.6455204754700425e-05, "optim/total_tokens": 1942323462144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3053076267242432, "created_at": "2025-06-03T04:51:19.104172+00:00"} {"global_step": 231544, "acc_step": 0, "speed/wps": 5530.465145330293, "speed/FLOPS": 244418251936849.34, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.049544185400009155, "optim/lr": 2.64516575296061e-05, "optim/total_tokens": 1942331850752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2928504943847656, "created_at": "2025-06-03T04:51:22.076019+00:00"} {"global_step": 231545, "acc_step": 0, "speed/wps": 5510.487104180445, "speed/FLOPS": 243535324774910.47, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04252233728766441, "optim/lr": 2.6448110304511552e-05, "optim/total_tokens": 1942340239360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3214126825332642, "created_at": "2025-06-03T04:51:25.056293+00:00"} {"global_step": 231546, "acc_step": 0, "speed/wps": 5524.493715213978, "speed/FLOPS": 244154345290258.28, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.14 hours", "speed/est_time_elapsed_hrs": 190.7, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.14, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04913735017180443, "optim/lr": 2.6444563079417006e-05, "optim/total_tokens": 1942348627968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3076313734054565, "created_at": "2025-06-03T04:51:28.026113+00:00"} {"global_step": 231547, "acc_step": 0, "speed/wps": 5529.582938789318, "speed/FLOPS": 244379262923280.66, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04205500707030296, "optim/lr": 2.644101585432246e-05, "optim/total_tokens": 1942357016576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3120208978652954, "created_at": "2025-06-03T04:51:30.992980+00:00"} {"global_step": 231548, "acc_step": 0, "speed/wps": 5530.621053537186, "speed/FLOPS": 244425142281583.44, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.44, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04822482168674469, "optim/lr": 2.6437468629228133e-05, "optim/total_tokens": 1942365405184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2872910499572754, "created_at": "2025-06-03T04:51:33.959461+00:00"} {"global_step": 231549, "acc_step": 0, "speed/wps": 5517.843087112761, "speed/FLOPS": 243860421569185.0, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.14 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.14, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04401041194796562, "optim/lr": 2.6433921404133587e-05, "optim/total_tokens": 1942373793792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2983667850494385, "created_at": "2025-06-03T04:51:36.935754+00:00"} {"global_step": 231550, "acc_step": 0, "speed/wps": 5527.8674104112715, "speed/FLOPS": 244303445349841.25, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04521603882312775, "optim/lr": 2.643037417903904e-05, "optim/total_tokens": 1942382182400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2923130989074707, "created_at": "2025-06-03T04:51:39.903660+00:00"} {"global_step": 231551, "acc_step": 0, "speed/wps": 5516.759981844297, "speed/FLOPS": 243812553860154.22, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.14 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.14, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041181620210409164, "optim/lr": 2.6426826953944494e-05, "optim/total_tokens": 1942390571008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.30459463596344, "created_at": "2025-06-03T04:51:42.879953+00:00"} {"global_step": 231552, "acc_step": 0, "speed/wps": 5512.8659078888195, "speed/FLOPS": 243640455722999.47, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.14 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.14, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04461268335580826, "optim/lr": 2.6423279728850168e-05, "optim/total_tokens": 1942398959616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2963343858718872, "created_at": "2025-06-03T04:51:45.857530+00:00"} {"global_step": 231553, "acc_step": 0, "speed/wps": 5509.969952294237, "speed/FLOPS": 243512469308563.4, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.15 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.15, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04162544757127762, "optim/lr": 2.641973250375562e-05, "optim/total_tokens": 1942407348224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2960131168365479, "created_at": "2025-06-03T04:51:48.838214+00:00"} {"global_step": 231554, "acc_step": 0, "speed/wps": 5528.7496477576005, "speed/FLOPS": 244342435724848.88, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04889295622706413, "optim/lr": 2.6416185278661075e-05, "optim/total_tokens": 1942415736832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3004837036132812, "created_at": "2025-06-03T04:51:51.807819+00:00"} {"global_step": 231555, "acc_step": 0, "speed/wps": 5528.641238005106, "speed/FLOPS": 244337644568680.03, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.044878505170345306, "optim/lr": 2.6412638053566752e-05, "optim/total_tokens": 1942424125440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2906211614608765, "created_at": "2025-06-03T04:51:54.776432+00:00"} {"global_step": 231556, "acc_step": 0, "speed/wps": 5538.026125167725, "speed/FLOPS": 244752408545060.72, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.24, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04359421879053116, "optim/lr": 2.6409090828472203e-05, "optim/total_tokens": 1942432514048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.304645299911499, "created_at": "2025-06-03T04:51:57.738730+00:00"} {"global_step": 231557, "acc_step": 0, "speed/wps": 5526.070896362544, "speed/FLOPS": 244224048624279.97, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04543300345540047, "optim/lr": 2.6405543603377656e-05, "optim/total_tokens": 1942440902656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3208073377609253, "created_at": "2025-06-03T04:52:00.710025+00:00"} {"global_step": 231558, "acc_step": 0, "speed/wps": 5528.197553626311, "speed/FLOPS": 244318035990119.8, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.044329043477773666, "optim/lr": 2.640199637828311e-05, "optim/total_tokens": 1942449291264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2992082834243774, "created_at": "2025-06-03T04:52:03.680259+00:00"} {"global_step": 231559, "acc_step": 0, "speed/wps": 5528.944491588458, "speed/FLOPS": 244351046824871.66, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04625292494893074, "optim/lr": 2.6398449153188787e-05, "optim/total_tokens": 1942457679872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2752439975738525, "created_at": "2025-06-03T04:52:06.647341+00:00"} {"global_step": 231560, "acc_step": 0, "speed/wps": 5521.22354888092, "speed/FLOPS": 244009820676565.78, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.82, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04257582873106003, "optim/lr": 2.639490192809424e-05, "optim/total_tokens": 1942466068480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2955328226089478, "created_at": "2025-06-03T04:52:09.619542+00:00"} {"global_step": 231561, "acc_step": 0, "speed/wps": 5512.171119406092, "speed/FLOPS": 243609749628312.75, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.14 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.14, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.0452004075050354, "optim/lr": 2.6391354702999694e-05, "optim/total_tokens": 1942474457088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2907805442810059, "created_at": "2025-06-03T04:52:12.595700+00:00"} {"global_step": 231562, "acc_step": 0, "speed/wps": 5527.391304585665, "speed/FLOPS": 244282403909279.97, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.56, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04346638172864914, "optim/lr": 2.6387807477905144e-05, "optim/total_tokens": 1942482845696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.295727252960205, "created_at": "2025-06-03T04:52:15.567231+00:00"} {"global_step": 231563, "acc_step": 0, "speed/wps": 5525.72434277408, "speed/FLOPS": 244208732729491.9, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.044345706701278687, "optim/lr": 2.638426025281082e-05, "optim/total_tokens": 1942491234304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3079023361206055, "created_at": "2025-06-03T04:52:18.539611+00:00"} {"global_step": 231564, "acc_step": 0, "speed/wps": 5536.742758291777, "speed/FLOPS": 244695690298010.97, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04240424185991287, "optim/lr": 2.6380713027716275e-05, "optim/total_tokens": 1942499622912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3069652318954468, "created_at": "2025-06-03T04:52:21.503738+00:00"} {"global_step": 231565, "acc_step": 0, "speed/wps": 5524.920835046315, "speed/FLOPS": 244173221800650.1, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.042454808950424194, "optim/lr": 2.637716580262173e-05, "optim/total_tokens": 1942508011520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3007241487503052, "created_at": "2025-06-03T04:52:24.478059+00:00"} {"global_step": 231566, "acc_step": 0, "speed/wps": 5531.606026619051, "speed/FLOPS": 244468673050252.6, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.045416224747896194, "optim/lr": 2.6373618577527182e-05, "optim/total_tokens": 1942516400128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2967416048049927, "created_at": "2025-06-03T04:52:27.448562+00:00"} {"global_step": 231567, "acc_step": 0, "speed/wps": 5519.458883870818, "speed/FLOPS": 243931831515493.56, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04358226805925369, "optim/lr": 2.6370071352432856e-05, "optim/total_tokens": 1942524788736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.283109426498413, "created_at": "2025-06-03T04:52:30.421857+00:00"} {"global_step": 231568, "acc_step": 0, "speed/wps": 5517.825225600937, "speed/FLOPS": 243859632181785.9, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.047478508204221725, "optim/lr": 2.636652412733831e-05, "optim/total_tokens": 1942533177344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2863225936889648, "created_at": "2025-06-03T04:52:33.395514+00:00"} {"global_step": 231569, "acc_step": 0, "speed/wps": 5514.117658423596, "speed/FLOPS": 243695776689596.56, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04224717617034912, "optim/lr": 2.6362976902243763e-05, "optim/total_tokens": 1942541565952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2896099090576172, "created_at": "2025-06-03T04:52:36.371504+00:00"} {"global_step": 231570, "acc_step": 0, "speed/wps": 5517.773524267484, "speed/FLOPS": 243857347247478.7, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.13 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.13, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.04536253586411476, "optim/lr": 2.6359429677149217e-05, "optim/total_tokens": 1942549954560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2933409214019775, "created_at": "2025-06-03T04:52:39.346979+00:00"} {"global_step": 231571, "acc_step": 0, "speed/wps": 5526.234846523986, "speed/FLOPS": 244231294382242.7, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043898943811655045, "optim/lr": 2.635588245205489e-05, "optim/total_tokens": 1942558343168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2880253791809082, "created_at": "2025-06-03T04:52:42.319661+00:00"} {"global_step": 231572, "acc_step": 0, "speed/wps": 5525.001080822716, "speed/FLOPS": 244176768253231.9, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042306073009967804, "optim/lr": 2.6352335226960345e-05, "optim/total_tokens": 1942566731776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2894089221954346, "created_at": "2025-06-03T04:52:45.289588+00:00"} {"global_step": 231573, "acc_step": 0, "speed/wps": 5532.938373690321, "speed/FLOPS": 244527555971232.25, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04124952107667923, "optim/lr": 2.6348788001865798e-05, "optim/total_tokens": 1942575120384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2914918661117554, "created_at": "2025-06-03T04:52:48.254831+00:00"} {"global_step": 231574, "acc_step": 0, "speed/wps": 5530.431708482011, "speed/FLOPS": 244416774199300.56, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04164881631731987, "optim/lr": 2.6345240776771252e-05, "optim/total_tokens": 1942583508992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.3001707792282104, "created_at": "2025-06-03T04:52:51.221870+00:00"} {"global_step": 231575, "acc_step": 0, "speed/wps": 5529.460662404175, "speed/FLOPS": 244373858932924.62, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043680936098098755, "optim/lr": 2.6341693551676926e-05, "optim/total_tokens": 1942591897600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2747231721878052, "created_at": "2025-06-03T04:52:54.189492+00:00"} {"global_step": 231576, "acc_step": 0, "speed/wps": 5520.247188901233, "speed/FLOPS": 243966670562927.0, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04805263504385948, "optim/lr": 2.633814632658238e-05, "optim/total_tokens": 1942600286208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3030834197998047, "created_at": "2025-06-03T04:52:57.164283+00:00"} {"global_step": 231577, "acc_step": 0, "speed/wps": 5526.508419920213, "speed/FLOPS": 244243384926080.34, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04375719279050827, "optim/lr": 2.6334599101487833e-05, "optim/total_tokens": 1942608674816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2929494380950928, "created_at": "2025-06-03T04:53:00.133322+00:00"} {"global_step": 231578, "acc_step": 0, "speed/wps": 5516.793819730947, "speed/FLOPS": 243814049321546.12, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.26, "optim/grad_norm": 0.041953664273023605, "optim/lr": 2.6331051876393286e-05, "optim/total_tokens": 1942617063424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2838432788848877, "created_at": "2025-06-03T04:53:03.111963+00:00"} {"global_step": 231579, "acc_step": 0, "speed/wps": 5522.628631456207, "speed/FLOPS": 244071918134528.84, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043656717985868454, "optim/lr": 2.632750465129896e-05, "optim/total_tokens": 1942625452032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2846057415008545, "created_at": "2025-06-03T04:53:06.082849+00:00"} {"global_step": 231580, "acc_step": 0, "speed/wps": 5518.855787961004, "speed/FLOPS": 243905177763204.53, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042434919625520706, "optim/lr": 2.6323957426204414e-05, "optim/total_tokens": 1942633840640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3022745847702026, "created_at": "2025-06-03T04:53:09.057028+00:00"} {"global_step": 231581, "acc_step": 0, "speed/wps": 5532.406697785389, "speed/FLOPS": 244504058617598.22, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04279814660549164, "optim/lr": 2.6320410201109867e-05, "optim/total_tokens": 1942642229248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2981665134429932, "created_at": "2025-06-03T04:53:12.022477+00:00"} {"global_step": 231582, "acc_step": 0, "speed/wps": 5522.585572524502, "speed/FLOPS": 244070015150143.1, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042669977992773056, "optim/lr": 2.6316862976015545e-05, "optim/total_tokens": 1942650617856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3012949228286743, "created_at": "2025-06-03T04:53:14.993533+00:00"} {"global_step": 231583, "acc_step": 0, "speed/wps": 5524.622003497183, "speed/FLOPS": 244160014975736.97, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042064618319272995, "optim/lr": 2.6313315750920995e-05, "optim/total_tokens": 1942659006464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2976419925689697, "created_at": "2025-06-03T04:53:17.966556+00:00"} {"global_step": 231584, "acc_step": 0, "speed/wps": 5519.366645864404, "speed/FLOPS": 243927755067727.0, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04750816524028778, "optim/lr": 2.630976852582645e-05, "optim/total_tokens": 1942667395072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2765661478042603, "created_at": "2025-06-03T04:53:20.939218+00:00"} {"global_step": 231585, "acc_step": 0, "speed/wps": 5518.99394239661, "speed/FLOPS": 243911283482119.78, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044125065207481384, "optim/lr": 2.6306221300731902e-05, "optim/total_tokens": 1942675783680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3008325099945068, "created_at": "2025-06-03T04:53:23.913695+00:00"} {"global_step": 231586, "acc_step": 0, "speed/wps": 5527.028388971312, "speed/FLOPS": 244266364896696.06, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04308013617992401, "optim/lr": 2.630267407563758e-05, "optim/total_tokens": 1942684172288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3011006116867065, "created_at": "2025-06-03T04:53:26.882204+00:00"} {"global_step": 231587, "acc_step": 0, "speed/wps": 5512.613342167846, "speed/FLOPS": 243629293610881.0, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04267962649464607, "optim/lr": 2.6299126850543033e-05, "optim/total_tokens": 1942692560896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2932425737380981, "created_at": "2025-06-03T04:53:29.858268+00:00"} {"global_step": 231588, "acc_step": 0, "speed/wps": 5533.340162604823, "speed/FLOPS": 244545312984711.12, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04263468086719513, "optim/lr": 2.6295579625448483e-05, "optim/total_tokens": 1942700949504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.305181622505188, "created_at": "2025-06-03T04:53:32.828638+00:00"} {"global_step": 231589, "acc_step": 0, "speed/wps": 5528.210989085772, "speed/FLOPS": 244318629768659.06, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04249105602502823, "optim/lr": 2.6292032400353937e-05, "optim/total_tokens": 1942709338112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2934964895248413, "created_at": "2025-06-03T04:53:35.796555+00:00"} {"global_step": 231590, "acc_step": 0, "speed/wps": 5523.383459586922, "speed/FLOPS": 244105277674345.88, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04218631982803345, "optim/lr": 2.6288485175259614e-05, "optim/total_tokens": 1942717726720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2936066389083862, "created_at": "2025-06-03T04:53:38.767747+00:00"} {"global_step": 231591, "acc_step": 0, "speed/wps": 5523.751187882149, "speed/FLOPS": 244121529382790.84, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04275186359882355, "optim/lr": 2.6284937950165068e-05, "optim/total_tokens": 1942726115328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2903558015823364, "created_at": "2025-06-03T04:53:41.740694+00:00"} {"global_step": 231592, "acc_step": 0, "speed/wps": 5510.478758610676, "speed/FLOPS": 243534955943443.16, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04273751750588417, "optim/lr": 2.628139072507052e-05, "optim/total_tokens": 1942734503936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.269704818725586, "created_at": "2025-06-03T04:53:44.719793+00:00"} {"global_step": 231593, "acc_step": 0, "speed/wps": 5522.432680102647, "speed/FLOPS": 244063258087671.47, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04263181984424591, "optim/lr": 2.627784349997597e-05, "optim/total_tokens": 1942742892544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.3104685544967651, "created_at": "2025-06-03T04:53:47.690406+00:00"} {"global_step": 231594, "acc_step": 0, "speed/wps": 5509.738283138658, "speed/FLOPS": 243502230717677.0, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.12 hours", "speed/est_time_elapsed_hrs": 191.25, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.12, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04289337992668152, "optim/lr": 2.627429627488165e-05, "optim/total_tokens": 1942751281152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2873685359954834, "created_at": "2025-06-03T04:53:50.667807+00:00"} {"global_step": 231595, "acc_step": 0, "speed/wps": 5511.570556499002, "speed/FLOPS": 243583207821779.0, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04273340106010437, "optim/lr": 2.6270749049787102e-05, "optim/total_tokens": 1942759669760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.3084384202957153, "created_at": "2025-06-03T04:53:53.644128+00:00"} {"global_step": 231596, "acc_step": 0, "speed/wps": 5528.908191253397, "speed/FLOPS": 244349442535863.9, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04224303364753723, "optim/lr": 2.6267201824692556e-05, "optim/total_tokens": 1942768058368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3015190362930298, "created_at": "2025-06-03T04:53:56.615108+00:00"} {"global_step": 231597, "acc_step": 0, "speed/wps": 5537.8603349705, "speed/FLOPS": 244745081466934.53, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 190.28, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04208306223154068, "optim/lr": 2.626365459959801e-05, "optim/total_tokens": 1942776446976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3088421821594238, "created_at": "2025-06-03T04:53:59.580448+00:00"} {"global_step": 231598, "acc_step": 0, "speed/wps": 5530.803148464425, "speed/FLOPS": 244433189945321.1, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04278511554002762, "optim/lr": 2.6260107374503683e-05, "optim/total_tokens": 1942784835584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2995402812957764, "created_at": "2025-06-03T04:54:02.550890+00:00"} {"global_step": 231599, "acc_step": 0, "speed/wps": 5524.333596346863, "speed/FLOPS": 244147268855894.44, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.7, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04372912645339966, "optim/lr": 2.6256560149409137e-05, "optim/total_tokens": 1942793224192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.296733021736145, "created_at": "2025-06-03T04:54:05.520775+00:00"} {"global_step": 231600, "acc_step": 0, "speed/wps": 5528.479609485203, "speed/FLOPS": 244330501415390.06, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04203997179865837, "optim/lr": 2.625301292431459e-05, "optim/total_tokens": 1942801612800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2755305767059326, "created_at": "2025-06-03T04:54:08.491336+00:00"} {"global_step": 231601, "acc_step": 0, "speed/wps": 5525.126819712314, "speed/FLOPS": 244182325268562.12, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0442064106464386, "optim/lr": 2.6249465699220044e-05, "optim/total_tokens": 1942810001408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2965236902236938, "created_at": "2025-06-03T04:54:11.461175+00:00"} {"global_step": 231602, "acc_step": 0, "speed/wps": 5518.141318149188, "speed/FLOPS": 243873601854510.25, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0415717177093029, "optim/lr": 2.6245918474125718e-05, "optim/total_tokens": 1942818390016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.305382490158081, "created_at": "2025-06-03T04:54:14.437372+00:00"} {"global_step": 231603, "acc_step": 0, "speed/wps": 5516.9228073146705, "speed/FLOPS": 243819749912528.4, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04247114062309265, "optim/lr": 2.624237124903117e-05, "optim/total_tokens": 1942826778624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2963520288467407, "created_at": "2025-06-03T04:54:17.412558+00:00"} {"global_step": 231604, "acc_step": 0, "speed/wps": 5510.8722408878175, "speed/FLOPS": 243552345846067.94, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 191.22, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04183570295572281, "optim/lr": 2.6238824023936625e-05, "optim/total_tokens": 1942835167232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.308123230934143, "created_at": "2025-06-03T04:54:20.392965+00:00"} {"global_step": 231605, "acc_step": 0, "speed/wps": 5505.260312028405, "speed/FLOPS": 243304327314937.75, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.11 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.11, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0451233834028244, "optim/lr": 2.623527679884208e-05, "optim/total_tokens": 1942843555840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.298761010169983, "created_at": "2025-06-03T04:54:23.377795+00:00"} {"global_step": 231606, "acc_step": 0, "speed/wps": 5519.3426644270985, "speed/FLOPS": 243926695210946.22, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0446908175945282, "optim/lr": 2.6231729573747753e-05, "optim/total_tokens": 1942851944448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2867337465286255, "created_at": "2025-06-03T04:54:26.350178+00:00"} {"global_step": 231607, "acc_step": 0, "speed/wps": 5523.231928447372, "speed/FLOPS": 244098580773584.44, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041862230747938156, "optim/lr": 2.6228182348653206e-05, "optim/total_tokens": 1942860333056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2980177402496338, "created_at": "2025-06-03T04:54:29.324533+00:00"} {"global_step": 231608, "acc_step": 0, "speed/wps": 5520.251329287828, "speed/FLOPS": 243966853546822.1, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04213012382388115, "optim/lr": 2.622463512355866e-05, "optim/total_tokens": 1942868721664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2913892269134521, "created_at": "2025-06-03T04:54:32.299223+00:00"} {"global_step": 231609, "acc_step": 0, "speed/wps": 5510.114499985116, "speed/FLOPS": 243518857576638.06, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04199724271893501, "optim/lr": 2.6221087898464334e-05, "optim/total_tokens": 1942877110272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2908416986465454, "created_at": "2025-06-03T04:54:35.277866+00:00"} {"global_step": 231610, "acc_step": 0, "speed/wps": 5515.137245465523, "speed/FLOPS": 243740837218130.12, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044672925025224686, "optim/lr": 2.6217540673369787e-05, "optim/total_tokens": 1942885498880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2936559915542603, "created_at": "2025-06-03T04:54:38.257427+00:00"} {"global_step": 231611, "acc_step": 0, "speed/wps": 5512.822193865051, "speed/FLOPS": 243638523786897.56, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04156416654586792, "optim/lr": 2.621399344827524e-05, "optim/total_tokens": 1942893887488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3011575937271118, "created_at": "2025-06-03T04:54:41.232965+00:00"} {"global_step": 231612, "acc_step": 0, "speed/wps": 5512.374850379025, "speed/FLOPS": 243618753494526.72, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04320788383483887, "optim/lr": 2.6210446223180694e-05, "optim/total_tokens": 1942902276096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3017137050628662, "created_at": "2025-06-03T04:54:44.212417+00:00"} {"global_step": 231613, "acc_step": 0, "speed/wps": 5513.982936228727, "speed/FLOPS": 243689822658154.06, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.046292711049318314, "optim/lr": 2.620689899808637e-05, "optim/total_tokens": 1942910664704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2923580408096313, "created_at": "2025-06-03T04:54:47.191434+00:00"} {"global_step": 231614, "acc_step": 0, "speed/wps": 5535.570477532098, "speed/FLOPS": 244643881488710.03, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.37, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041732657700777054, "optim/lr": 2.6203351772991825e-05, "optim/total_tokens": 1942919053312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.299742341041565, "created_at": "2025-06-03T04:54:50.156664+00:00"} {"global_step": 231615, "acc_step": 0, "speed/wps": 5517.777885495737, "speed/FLOPS": 243857539991444.66, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0486900769174099, "optim/lr": 2.6199804547897275e-05, "optim/total_tokens": 1942927441920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2992817163467407, "created_at": "2025-06-03T04:54:53.130165+00:00"} {"global_step": 231616, "acc_step": 0, "speed/wps": 5520.224265103484, "speed/FLOPS": 243965657448401.12, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 190.83, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04434822499752045, "optim/lr": 2.619625732280273e-05, "optim/total_tokens": 1942935830528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3130323886871338, "created_at": "2025-06-03T04:54:56.101931+00:00"} {"global_step": 231617, "acc_step": 0, "speed/wps": 5528.519829828202, "speed/FLOPS": 244332278948684.28, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 190.62, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04435703158378601, "optim/lr": 2.6192710097708406e-05, "optim/total_tokens": 1942944219136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2998992204666138, "created_at": "2025-06-03T04:54:59.069600+00:00"} {"global_step": 231618, "acc_step": 0, "speed/wps": 5502.362528441196, "speed/FLOPS": 243176260112584.1, "speed/curr_iter_time": 2.9767, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9767, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05332488194108009, "optim/lr": 2.618916287261386e-05, "optim/total_tokens": 1942952607744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3142330646514893, "created_at": "2025-06-03T04:55:02.054218+00:00"} {"global_step": 231619, "acc_step": 0, "speed/wps": 5517.514020233062, "speed/FLOPS": 243845878497419.28, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04393138736486435, "optim/lr": 2.6185615647519314e-05, "optim/total_tokens": 1942960996352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2888346910476685, "created_at": "2025-06-03T04:55:05.030011+00:00"} {"global_step": 231620, "acc_step": 0, "speed/wps": 5521.392704008531, "speed/FLOPS": 244017296467391.75, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0515170693397522, "optim/lr": 2.6182068422424764e-05, "optim/total_tokens": 1942969384960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3036260604858398, "created_at": "2025-06-03T04:55:08.001251+00:00"} {"global_step": 231621, "acc_step": 0, "speed/wps": 5505.790815833965, "speed/FLOPS": 243327772867778.88, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.1 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.1, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042477674782276154, "optim/lr": 2.617852119733044e-05, "optim/total_tokens": 1942977773568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2858058214187622, "created_at": "2025-06-03T04:55:10.981428+00:00"} {"global_step": 231622, "acc_step": 0, "speed/wps": 5519.810513239588, "speed/FLOPS": 243947371733790.94, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04564902186393738, "optim/lr": 2.6174973972235895e-05, "optim/total_tokens": 1942986162176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2945334911346436, "created_at": "2025-06-03T04:55:13.953602+00:00"} {"global_step": 231623, "acc_step": 0, "speed/wps": 5529.047774778693, "speed/FLOPS": 244355611413228.72, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04313359037041664, "optim/lr": 2.6171426747141348e-05, "optim/total_tokens": 1942994550784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2917660474777222, "created_at": "2025-06-03T04:55:16.920698+00:00"} {"global_step": 231624, "acc_step": 0, "speed/wps": 5523.471054983956, "speed/FLOPS": 244109148942540.84, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044746700674295425, "optim/lr": 2.6167879522046802e-05, "optim/total_tokens": 1943002939392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2899432182312012, "created_at": "2025-06-03T04:55:19.890628+00:00"} {"global_step": 231625, "acc_step": 0, "speed/wps": 5509.092869648293, "speed/FLOPS": 243473706744928.62, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043576985597610474, "optim/lr": 2.6164332296952476e-05, "optim/total_tokens": 1943011328000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2932742834091187, "created_at": "2025-06-03T04:55:22.868347+00:00"} {"global_step": 231626, "acc_step": 0, "speed/wps": 5517.932451357602, "speed/FLOPS": 243864371011399.3, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043716657906770706, "optim/lr": 2.616078507185793e-05, "optim/total_tokens": 1943019716608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3024442195892334, "created_at": "2025-06-03T04:55:25.842772+00:00"} {"global_step": 231627, "acc_step": 0, "speed/wps": 5522.578871051854, "speed/FLOPS": 244069718979353.28, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.83, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04187648370862007, "optim/lr": 2.6157237846763383e-05, "optim/total_tokens": 1943028105216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2938016653060913, "created_at": "2025-06-03T04:55:28.817711+00:00"} {"global_step": 231628, "acc_step": 0, "speed/wps": 5516.921817258742, "speed/FLOPS": 243819706157123.94, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04576672613620758, "optim/lr": 2.6153690621668836e-05, "optim/total_tokens": 1943036493824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2990716695785522, "created_at": "2025-06-03T04:55:31.791768+00:00"} {"global_step": 231629, "acc_step": 0, "speed/wps": 5511.759307305007, "speed/FLOPS": 243591549641290.2, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.047250211238861084, "optim/lr": 2.615014339657451e-05, "optim/total_tokens": 1943044882432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.308573603630066, "created_at": "2025-06-03T04:55:34.772393+00:00"} {"global_step": 231630, "acc_step": 0, "speed/wps": 5528.33083187826, "speed/FLOPS": 244323926206676.03, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0468255952000618, "optim/lr": 2.6146596171479964e-05, "optim/total_tokens": 1943053271040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2871216535568237, "created_at": "2025-06-03T04:55:37.740222+00:00"} {"global_step": 231631, "acc_step": 0, "speed/wps": 5516.943402202177, "speed/FLOPS": 243820660101142.0, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.059093233197927475, "optim/lr": 2.6143048946385417e-05, "optim/total_tokens": 1943061659648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3114131689071655, "created_at": "2025-06-03T04:55:40.717532+00:00"} {"global_step": 231632, "acc_step": 0, "speed/wps": 5519.282967588234, "speed/FLOPS": 243924056916224.53, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04256273806095123, "optim/lr": 2.613950172129087e-05, "optim/total_tokens": 1943070048256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2864001989364624, "created_at": "2025-06-03T04:55:43.694147+00:00"} {"global_step": 231633, "acc_step": 0, "speed/wps": 5521.681070627716, "speed/FLOPS": 244030040795965.53, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.82, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.055382706224918365, "optim/lr": 2.6135954496196545e-05, "optim/total_tokens": 1943078436864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.277144432067871, "created_at": "2025-06-03T04:55:46.665493+00:00"} {"global_step": 231634, "acc_step": 0, "speed/wps": 5524.54477313457, "speed/FLOPS": 244156601789010.34, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04600627347826958, "optim/lr": 2.6132407271102e-05, "optim/total_tokens": 1943086825472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.301171898841858, "created_at": "2025-06-03T04:55:49.634964+00:00"} {"global_step": 231635, "acc_step": 0, "speed/wps": 5516.844443475689, "speed/FLOPS": 243816286631947.94, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.046141378581523895, "optim/lr": 2.6128860046007452e-05, "optim/total_tokens": 1943095214080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3039788007736206, "created_at": "2025-06-03T04:55:52.608466+00:00"} {"global_step": 231636, "acc_step": 0, "speed/wps": 5518.421473271494, "speed/FLOPS": 243885983276952.25, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044947024434804916, "optim/lr": 2.6125312820913126e-05, "optim/total_tokens": 1943103602688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2863274812698364, "created_at": "2025-06-03T04:55:55.583070+00:00"} {"global_step": 231637, "acc_step": 0, "speed/wps": 5504.238679377156, "speed/FLOPS": 243259176380942.47, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.09 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.09, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0428461916744709, "optim/lr": 2.612176559581858e-05, "optim/total_tokens": 1943111991296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.292608618736267, "created_at": "2025-06-03T04:55:58.564046+00:00"} {"global_step": 231638, "acc_step": 0, "speed/wps": 5512.082540538405, "speed/FLOPS": 243605834895748.72, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04423374682664871, "optim/lr": 2.6118218370724033e-05, "optim/total_tokens": 1943120379904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2866078615188599, "created_at": "2025-06-03T04:56:01.544114+00:00"} {"global_step": 231639, "acc_step": 0, "speed/wps": 5518.534862054414, "speed/FLOPS": 243890994480780.9, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05025423690676689, "optim/lr": 2.6114671145629487e-05, "optim/total_tokens": 1943128768512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3063325881958008, "created_at": "2025-06-03T04:56:04.517311+00:00"} {"global_step": 231640, "acc_step": 0, "speed/wps": 5522.722549733507, "speed/FLOPS": 244076068841668.2, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04299495369195938, "optim/lr": 2.6111123920535164e-05, "optim/total_tokens": 1943137157120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3056466579437256, "created_at": "2025-06-03T04:56:07.487595+00:00"} {"global_step": 231641, "acc_step": 0, "speed/wps": 5518.887521143333, "speed/FLOPS": 243906580207438.3, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04224203899502754, "optim/lr": 2.6107576695440614e-05, "optim/total_tokens": 1943145545728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3078234195709229, "created_at": "2025-06-03T04:56:10.463896+00:00"} {"global_step": 231642, "acc_step": 0, "speed/wps": 5519.778817935415, "speed/FLOPS": 243945970963577.78, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04282332584261894, "optim/lr": 2.6104029470346068e-05, "optim/total_tokens": 1943153934336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2892431020736694, "created_at": "2025-06-03T04:56:13.436206+00:00"} {"global_step": 231643, "acc_step": 0, "speed/wps": 5522.822239595926, "speed/FLOPS": 244080474623328.12, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04273122176527977, "optim/lr": 2.610048224525152e-05, "optim/total_tokens": 1943162322944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2786585092544556, "created_at": "2025-06-03T04:56:16.406442+00:00"} {"global_step": 231644, "acc_step": 0, "speed/wps": 5506.779745778827, "speed/FLOPS": 243371478509539.47, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04231277480721474, "optim/lr": 2.60969350201572e-05, "optim/total_tokens": 1943170711552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2873620986938477, "created_at": "2025-06-03T04:56:19.387676+00:00"} {"global_step": 231645, "acc_step": 0, "speed/wps": 5509.466334279503, "speed/FLOPS": 243490211970062.8, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04309212416410446, "optim/lr": 2.6093387795062652e-05, "optim/total_tokens": 1943179100160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2978870868682861, "created_at": "2025-06-03T04:56:22.365482+00:00"} {"global_step": 231646, "acc_step": 0, "speed/wps": 5506.185540538022, "speed/FLOPS": 243345217679314.0, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041923269629478455, "optim/lr": 2.6089840569968102e-05, "optim/total_tokens": 1943187488768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3034173250198364, "created_at": "2025-06-03T04:56:25.345222+00:00"} {"global_step": 231647, "acc_step": 0, "speed/wps": 5506.471737854687, "speed/FLOPS": 243357866135819.9, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0433092899620533, "optim/lr": 2.6086293344873556e-05, "optim/total_tokens": 1943195877376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2927626371383667, "created_at": "2025-06-03T04:56:28.324451+00:00"} {"global_step": 231648, "acc_step": 0, "speed/wps": 5505.613286836318, "speed/FLOPS": 243319926994758.7, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04305526241660118, "optim/lr": 2.6082746119779233e-05, "optim/total_tokens": 1943204265984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.276214599609375, "created_at": "2025-06-03T04:56:31.305235+00:00"} {"global_step": 231649, "acc_step": 0, "speed/wps": 5521.019412392851, "speed/FLOPS": 244000798888658.4, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04158527031540871, "optim/lr": 2.6079198894684687e-05, "optim/total_tokens": 1943212654592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2960882186889648, "created_at": "2025-06-03T04:56:34.278322+00:00"} {"global_step": 231650, "acc_step": 0, "speed/wps": 5513.968435236293, "speed/FLOPS": 243689181788511.25, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04255323112010956, "optim/lr": 2.607565166959014e-05, "optim/total_tokens": 1943221043200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3070979118347168, "created_at": "2025-06-03T04:56:37.254314+00:00"} {"global_step": 231651, "acc_step": 0, "speed/wps": 5516.586509346354, "speed/FLOPS": 243804887263657.9, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04194260761141777, "optim/lr": 2.607210444449559e-05, "optim/total_tokens": 1943229431808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2975566387176514, "created_at": "2025-06-03T04:56:40.229749+00:00"} {"global_step": 231652, "acc_step": 0, "speed/wps": 5507.586371938914, "speed/FLOPS": 243407127257128.34, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041504841297864914, "optim/lr": 2.6068557219401268e-05, "optim/total_tokens": 1943237820416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.30048406124115, "created_at": "2025-06-03T04:56:43.211297+00:00"} {"global_step": 231653, "acc_step": 0, "speed/wps": 5496.763270838528, "speed/FLOPS": 242928801586144.62, "speed/curr_iter_time": 2.979, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.979, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "6.08 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 6.08, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04286417365074158, "optim/lr": 2.606500999430672e-05, "optim/total_tokens": 1943246209024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.302413821220398, "created_at": "2025-06-03T04:56:46.200422+00:00"} {"global_step": 231654, "acc_step": 0, "speed/wps": 5509.482207919809, "speed/FLOPS": 243490913503715.7, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04564767703413963, "optim/lr": 2.6061462769212175e-05, "optim/total_tokens": 1943254597632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3005181550979614, "created_at": "2025-06-03T04:56:49.178294+00:00"} {"global_step": 231655, "acc_step": 0, "speed/wps": 5518.239348889399, "speed/FLOPS": 243877934311460.75, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04164223000407219, "optim/lr": 2.605791554411763e-05, "optim/total_tokens": 1943262986240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2945761680603027, "created_at": "2025-06-03T04:56:52.151467+00:00"} {"global_step": 231656, "acc_step": 0, "speed/wps": 5527.899583421381, "speed/FLOPS": 244304867232211.7, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043654222041368484, "optim/lr": 2.6054368319023303e-05, "optim/total_tokens": 1943271374848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2904568910598755, "created_at": "2025-06-03T04:56:55.124032+00:00"} {"global_step": 231657, "acc_step": 0, "speed/wps": 5517.624257598689, "speed/FLOPS": 243850750424734.0, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04422828555107117, "optim/lr": 2.6050821093928756e-05, "optim/total_tokens": 1943279763456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3064627647399902, "created_at": "2025-06-03T04:56:58.097622+00:00"} {"global_step": 231658, "acc_step": 0, "speed/wps": 5524.209443064428, "speed/FLOPS": 244141781916284.94, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042847711592912674, "optim/lr": 2.604727386883421e-05, "optim/total_tokens": 1943288152064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3026715517044067, "created_at": "2025-06-03T04:57:01.067348+00:00"} {"global_step": 231659, "acc_step": 0, "speed/wps": 5509.947621571599, "speed/FLOPS": 243511482404921.75, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 191.25, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04301240295171738, "optim/lr": 2.6043726643739663e-05, "optim/total_tokens": 1943296540672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.292984962463379, "created_at": "2025-06-03T04:57:04.044555+00:00"} {"global_step": 231660, "acc_step": 0, "speed/wps": 5519.382818170544, "speed/FLOPS": 243928469800881.03, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042735688388347626, "optim/lr": 2.6040179418645337e-05, "optim/total_tokens": 1943304929280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2855874300003052, "created_at": "2025-06-03T04:57:07.021649+00:00"} {"global_step": 231661, "acc_step": 0, "speed/wps": 5497.493771388279, "speed/FLOPS": 242961085971402.88, "speed/curr_iter_time": 2.9795, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9795, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04202667251229286, "optim/lr": 2.603663219355079e-05, "optim/total_tokens": 1943313317888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2890070676803589, "created_at": "2025-06-03T04:57:10.010129+00:00"} {"global_step": 231662, "acc_step": 0, "speed/wps": 5524.9972079001745, "speed/FLOPS": 244176597089878.97, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04447101056575775, "optim/lr": 2.6033084968456244e-05, "optim/total_tokens": 1943321706496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.267324686050415, "created_at": "2025-06-03T04:57:12.983392+00:00"} {"global_step": 231663, "acc_step": 0, "speed/wps": 5505.396552598493, "speed/FLOPS": 243310348450793.2, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.06 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.06, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04664819315075874, "optim/lr": 2.602953774336192e-05, "optim/total_tokens": 1943330095104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3044235706329346, "created_at": "2025-06-03T04:57:15.963740+00:00"} {"global_step": 231664, "acc_step": 0, "speed/wps": 5513.187949618681, "speed/FLOPS": 243654688319100.34, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04519740864634514, "optim/lr": 2.6025990518267372e-05, "optim/total_tokens": 1943338483712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2968300580978394, "created_at": "2025-06-03T04:57:18.939260+00:00"} {"global_step": 231665, "acc_step": 0, "speed/wps": 5522.434479980914, "speed/FLOPS": 244063337633078.25, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04351875185966492, "optim/lr": 2.6022443293172826e-05, "optim/total_tokens": 1943346872320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3014945983886719, "created_at": "2025-06-03T04:57:21.914904+00:00"} {"global_step": 231666, "acc_step": 0, "speed/wps": 5518.327783444563, "speed/FLOPS": 243881842666149.9, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042162202298641205, "optim/lr": 2.601889606807828e-05, "optim/total_tokens": 1943355260928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3029365539550781, "created_at": "2025-06-03T04:57:24.888257+00:00"} {"global_step": 231667, "acc_step": 0, "speed/wps": 5526.334052583062, "speed/FLOPS": 244235678782271.22, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.06385425478219986, "optim/lr": 2.6015348842983953e-05, "optim/total_tokens": 1943363649536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3008605241775513, "created_at": "2025-06-03T04:57:27.857740+00:00"} {"global_step": 231668, "acc_step": 0, "speed/wps": 5515.556879837599, "speed/FLOPS": 243759382909492.47, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04297548905014992, "optim/lr": 2.6011801617889407e-05, "optim/total_tokens": 1943372038144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.276442289352417, "created_at": "2025-06-03T04:57:30.832462+00:00"} {"global_step": 231669, "acc_step": 0, "speed/wps": 5509.053531834691, "speed/FLOPS": 243471968214916.56, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042352139949798584, "optim/lr": 2.600825439279486e-05, "optim/total_tokens": 1943380426752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2981479167938232, "created_at": "2025-06-03T04:57:33.814452+00:00"} {"global_step": 231670, "acc_step": 0, "speed/wps": 5508.813801466542, "speed/FLOPS": 243461373359695.66, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04390125349164009, "optim/lr": 2.6004707167700314e-05, "optim/total_tokens": 1943388815360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2992497682571411, "created_at": "2025-06-03T04:57:36.798268+00:00"} {"global_step": 231671, "acc_step": 0, "speed/wps": 5494.808802280858, "speed/FLOPS": 242842424079772.56, "speed/curr_iter_time": 2.981, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.981, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "6.07 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 6.07, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042856208980083466, "optim/lr": 2.600115994260599e-05, "optim/total_tokens": 1943397203968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2770819664001465, "created_at": "2025-06-03T04:57:39.788691+00:00"} {"global_step": 231672, "acc_step": 0, "speed/wps": 5524.446642712712, "speed/FLOPS": 244152264926641.22, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04223938286304474, "optim/lr": 2.5997612717511445e-05, "optim/total_tokens": 1943405592576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3121256828308105, "created_at": "2025-06-03T04:57:42.759075+00:00"} {"global_step": 231673, "acc_step": 0, "speed/wps": 5513.422455916557, "speed/FLOPS": 243665052297154.4, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042067062109708786, "optim/lr": 2.5994065492416895e-05, "optim/total_tokens": 1943413981184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2892227172851562, "created_at": "2025-06-03T04:57:45.735367+00:00"} {"global_step": 231674, "acc_step": 0, "speed/wps": 5528.7813158524195, "speed/FLOPS": 244343835292547.88, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042586568742990494, "optim/lr": 2.599051826732235e-05, "optim/total_tokens": 1943422369792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2845484018325806, "created_at": "2025-06-03T04:57:48.703648+00:00"} {"global_step": 231675, "acc_step": 0, "speed/wps": 5518.721699763014, "speed/FLOPS": 243899251751178.97, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04189351201057434, "optim/lr": 2.5986971042228026e-05, "optim/total_tokens": 1943430758400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2745732069015503, "created_at": "2025-06-03T04:57:51.676438+00:00"} {"global_step": 231676, "acc_step": 0, "speed/wps": 5513.357314237086, "speed/FLOPS": 243662173368347.16, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042508695274591446, "optim/lr": 2.598342381713348e-05, "optim/total_tokens": 1943439147008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3004671335220337, "created_at": "2025-06-03T04:57:54.656586+00:00"} {"global_step": 231677, "acc_step": 0, "speed/wps": 5519.582240533927, "speed/FLOPS": 243937283248606.34, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04584326967597008, "optim/lr": 2.5979876592038933e-05, "optim/total_tokens": 1943447535616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.3163810968399048, "created_at": "2025-06-03T04:57:57.629142+00:00"} {"global_step": 231678, "acc_step": 0, "speed/wps": 5507.38159347023, "speed/FLOPS": 243398077096963.72, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.05 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.05, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04191224277019501, "optim/lr": 2.5976329366944383e-05, "optim/total_tokens": 1943455924224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.296375036239624, "created_at": "2025-06-03T04:58:00.612432+00:00"} {"global_step": 231679, "acc_step": 0, "speed/wps": 5510.519577490372, "speed/FLOPS": 243536759928995.78, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042406391352415085, "optim/lr": 2.597278214185006e-05, "optim/total_tokens": 1943464312832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2905710935592651, "created_at": "2025-06-03T04:58:03.593954+00:00"} {"global_step": 231680, "acc_step": 0, "speed/wps": 5512.224258162035, "speed/FLOPS": 243612098089336.62, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04264422133564949, "optim/lr": 2.5969234916755514e-05, "optim/total_tokens": 1943472701440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.288209080696106, "created_at": "2025-06-03T04:58:06.573679+00:00"} {"global_step": 231681, "acc_step": 0, "speed/wps": 5513.643752575131, "speed/FLOPS": 243674832476764.4, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0424581840634346, "optim/lr": 2.5965687691660968e-05, "optim/total_tokens": 1943481090048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2898505926132202, "created_at": "2025-06-03T04:58:09.549228+00:00"} {"global_step": 231682, "acc_step": 0, "speed/wps": 5525.1069519181265, "speed/FLOPS": 244181447213751.66, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04232928529381752, "optim/lr": 2.596214046656642e-05, "optim/total_tokens": 1943489478656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2946839332580566, "created_at": "2025-06-03T04:58:12.518545+00:00"} {"global_step": 231683, "acc_step": 0, "speed/wps": 5512.414916189535, "speed/FLOPS": 243620524198275.84, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.04 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.04, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042163215577602386, "optim/lr": 2.5958593241472095e-05, "optim/total_tokens": 1943497867264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2850148677825928, "created_at": "2025-06-03T04:58:15.494570+00:00"} {"global_step": 231684, "acc_step": 0, "speed/wps": 5526.6200400450825, "speed/FLOPS": 244248317964276.0, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044500090181827545, "optim/lr": 2.595504601637755e-05, "optim/total_tokens": 1943506255872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.295665979385376, "created_at": "2025-06-03T04:58:18.464504+00:00"} {"global_step": 231685, "acc_step": 0, "speed/wps": 5527.75430042975, "speed/FLOPS": 244298446467607.38, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.7, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0436529666185379, "optim/lr": 2.5951498791283002e-05, "optim/total_tokens": 1943514644480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3062909841537476, "created_at": "2025-06-03T04:58:21.436638+00:00"} {"global_step": 231686, "acc_step": 0, "speed/wps": 5517.215876029528, "speed/FLOPS": 243832702049663.44, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04288455471396446, "optim/lr": 2.5947951566188456e-05, "optim/total_tokens": 1943523033088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3012051582336426, "created_at": "2025-06-03T04:58:24.414817+00:00"} {"global_step": 231687, "acc_step": 0, "speed/wps": 5516.597002508644, "speed/FLOPS": 243805351007722.25, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04200071841478348, "optim/lr": 2.594440434109413e-05, "optim/total_tokens": 1943531421696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2893972396850586, "created_at": "2025-06-03T04:58:27.388976+00:00"} {"global_step": 231688, "acc_step": 0, "speed/wps": 5513.617840942168, "speed/FLOPS": 243673687315215.22, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04347344860434532, "optim/lr": 2.5940857115999583e-05, "optim/total_tokens": 1943539810304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.312013864517212, "created_at": "2025-06-03T04:58:30.364219+00:00"} {"global_step": 231689, "acc_step": 0, "speed/wps": 5527.815248886786, "speed/FLOPS": 244301140077445.88, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04778663069009781, "optim/lr": 2.5937309890905037e-05, "optim/total_tokens": 1943548198912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3045058250427246, "created_at": "2025-06-03T04:58:33.331987+00:00"} {"global_step": 231690, "acc_step": 0, "speed/wps": 5516.927061661274, "speed/FLOPS": 243819937932872.56, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.045255329459905624, "optim/lr": 2.593376266581071e-05, "optim/total_tokens": 1943556587520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2940552234649658, "created_at": "2025-06-03T04:58:36.306383+00:00"} {"global_step": 231691, "acc_step": 0, "speed/wps": 5520.836234617227, "speed/FLOPS": 243992703368564.66, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04212011396884918, "optim/lr": 2.5930215440716164e-05, "optim/total_tokens": 1943564976128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2946540117263794, "created_at": "2025-06-03T04:58:39.278792+00:00"} {"global_step": 231692, "acc_step": 0, "speed/wps": 5521.392727836123, "speed/FLOPS": 244017297520449.38, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042607177048921585, "optim/lr": 2.5926668215621618e-05, "optim/total_tokens": 1943573364736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2934869527816772, "created_at": "2025-06-03T04:58:42.250114+00:00"} {"global_step": 231693, "acc_step": 0, "speed/wps": 5515.049145682504, "speed/FLOPS": 243736943658656.25, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042401500046253204, "optim/lr": 2.592312099052707e-05, "optim/total_tokens": 1943581753344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.288377285003662, "created_at": "2025-06-03T04:58:45.228868+00:00"} {"global_step": 231694, "acc_step": 0, "speed/wps": 5526.195928820897, "speed/FLOPS": 244229574418965.03, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04182638227939606, "optim/lr": 2.5919573765432745e-05, "optim/total_tokens": 1943590141952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2937829494476318, "created_at": "2025-06-03T04:58:48.201837+00:00"} {"global_step": 231695, "acc_step": 0, "speed/wps": 5512.194380520311, "speed/FLOPS": 243610777650500.06, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.25, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043006088584661484, "optim/lr": 2.59160265403382e-05, "optim/total_tokens": 1943598530560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2978756427764893, "created_at": "2025-06-03T04:58:51.177873+00:00"} {"global_step": 231696, "acc_step": 0, "speed/wps": 5514.5168355695605, "speed/FLOPS": 243713418276274.3, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04602089151740074, "optim/lr": 2.5912479315243653e-05, "optim/total_tokens": 1943606919168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2876900434494019, "created_at": "2025-06-03T04:58:54.157092+00:00"} {"global_step": 231697, "acc_step": 0, "speed/wps": 5524.489039328718, "speed/FLOPS": 244154138640063.12, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 190.83, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042929019778966904, "optim/lr": 2.5908932090149106e-05, "optim/total_tokens": 1943615307776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.283036708831787, "created_at": "2025-06-03T04:58:57.126336+00:00"} {"global_step": 231698, "acc_step": 0, "speed/wps": 5523.367922373439, "speed/FLOPS": 244104591009036.56, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043728142976760864, "optim/lr": 2.5905384865054783e-05, "optim/total_tokens": 1943623696384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2995109558105469, "created_at": "2025-06-03T04:59:00.099531+00:00"} {"global_step": 231699, "acc_step": 0, "speed/wps": 5532.851252980015, "speed/FLOPS": 244523705681760.9, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04476969689130783, "optim/lr": 2.5901837639960234e-05, "optim/total_tokens": 1943632084992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.293461561203003, "created_at": "2025-06-03T04:59:03.070065+00:00"} {"global_step": 231700, "acc_step": 0, "speed/wps": 5518.845933283915, "speed/FLOPS": 243904742236917.97, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04381031543016434, "optim/lr": 2.5898290414865687e-05, "optim/total_tokens": 1943640473600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2954511642456055, "created_at": "2025-06-03T04:59:06.047204+00:00"} {"global_step": 231701, "acc_step": 0, "speed/wps": 5511.477529098291, "speed/FLOPS": 243579096486824.94, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04207638278603554, "optim/lr": 2.589474318977114e-05, "optim/total_tokens": 1943648862208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2888355255126953, "created_at": "2025-06-03T04:59:09.027765+00:00"} {"global_step": 231702, "acc_step": 0, "speed/wps": 5510.4384352795005, "speed/FLOPS": 243533173858598.72, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.03 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.03, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041677966713905334, "optim/lr": 2.5891195964676818e-05, "optim/total_tokens": 1943657250816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.289377212524414, "created_at": "2025-06-03T04:59:12.006708+00:00"} {"global_step": 231703, "acc_step": 0, "speed/wps": 5521.665809452495, "speed/FLOPS": 244029366330134.56, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.047609176486730576, "optim/lr": 2.588764873958227e-05, "optim/total_tokens": 1943665639424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2879632711410522, "created_at": "2025-06-03T04:59:14.979065+00:00"} {"global_step": 231704, "acc_step": 0, "speed/wps": 5514.93952163693, "speed/FLOPS": 243732098836948.66, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04393429309129715, "optim/lr": 2.5884101514487722e-05, "optim/total_tokens": 1943674028032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.290299415588379, "created_at": "2025-06-03T04:59:17.957105+00:00"} {"global_step": 231705, "acc_step": 0, "speed/wps": 5511.286884541318, "speed/FLOPS": 243570670973214.03, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044003162533044815, "optim/lr": 2.5880554289393175e-05, "optim/total_tokens": 1943682416640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.296244502067566, "created_at": "2025-06-03T04:59:20.933691+00:00"} {"global_step": 231706, "acc_step": 0, "speed/wps": 5523.421197890676, "speed/FLOPS": 244106945514209.62, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04286923632025719, "optim/lr": 2.5877007064298853e-05, "optim/total_tokens": 1943690805248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2923126220703125, "created_at": "2025-06-03T04:59:23.904472+00:00"} {"global_step": 231707, "acc_step": 0, "speed/wps": 5517.20836655958, "speed/FLOPS": 243832370169528.72, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04724562540650368, "optim/lr": 2.5873459839204306e-05, "optim/total_tokens": 1943699193856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2948024272918701, "created_at": "2025-06-03T04:59:26.882790+00:00"} {"global_step": 231708, "acc_step": 0, "speed/wps": 5522.145525049439, "speed/FLOPS": 244050567304112.47, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.048470158129930496, "optim/lr": 2.586991261410976e-05, "optim/total_tokens": 1943707582464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2960442304611206, "created_at": "2025-06-03T04:59:29.853325+00:00"} {"global_step": 231709, "acc_step": 0, "speed/wps": 5525.792110640753, "speed/FLOPS": 244211727722331.47, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04239845275878906, "optim/lr": 2.586636538901521e-05, "optim/total_tokens": 1943715971072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2922254800796509, "created_at": "2025-06-03T04:59:32.822539+00:00"} {"global_step": 231710, "acc_step": 0, "speed/wps": 5516.135408582546, "speed/FLOPS": 243784950918840.6, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04823126643896103, "optim/lr": 2.5862818163920887e-05, "optim/total_tokens": 1943724359680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2898591756820679, "created_at": "2025-06-03T04:59:35.797721+00:00"} {"global_step": 231711, "acc_step": 0, "speed/wps": 5515.871789449056, "speed/FLOPS": 243773300302465.38, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043865419924259186, "optim/lr": 2.585927093882634e-05, "optim/total_tokens": 1943732748288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2923749685287476, "created_at": "2025-06-03T04:59:38.771579+00:00"} {"global_step": 231712, "acc_step": 0, "speed/wps": 5508.266688714196, "speed/FLOPS": 243437193776418.88, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.02 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.02, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04155442491173744, "optim/lr": 2.5855723713731795e-05, "optim/total_tokens": 1943741136896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.279164433479309, "created_at": "2025-06-03T04:59:41.750600+00:00"} {"global_step": 231713, "acc_step": 0, "speed/wps": 5514.017574820669, "speed/FLOPS": 243691353506621.5, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042182765901088715, "optim/lr": 2.5852176488637248e-05, "optim/total_tokens": 1943749525504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2816483974456787, "created_at": "2025-06-03T04:59:44.727509+00:00"} {"global_step": 231714, "acc_step": 0, "speed/wps": 5524.0072816742895, "speed/FLOPS": 244132847417596.6, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041645199060440063, "optim/lr": 2.5848629263542922e-05, "optim/total_tokens": 1943757914112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2905768156051636, "created_at": "2025-06-03T04:59:47.697172+00:00"} {"global_step": 231715, "acc_step": 0, "speed/wps": 5524.21849552959, "speed/FLOPS": 244142181988910.38, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04191445931792259, "optim/lr": 2.5845082038448376e-05, "optim/total_tokens": 1943766302720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2806357145309448, "created_at": "2025-06-03T04:59:50.667600+00:00"} {"global_step": 231716, "acc_step": 0, "speed/wps": 5516.6717445775985, "speed/FLOPS": 243808654224605.4, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04165448620915413, "optim/lr": 2.584153481335383e-05, "optim/total_tokens": 1943774691328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3036713600158691, "created_at": "2025-06-03T04:59:53.641528+00:00"} {"global_step": 231717, "acc_step": 0, "speed/wps": 5517.982891769856, "speed/FLOPS": 243866600219443.5, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04139413684606552, "optim/lr": 2.5837987588259503e-05, "optim/total_tokens": 1943783079936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2965589761734009, "created_at": "2025-06-03T04:59:56.617901+00:00"} {"global_step": 231718, "acc_step": 0, "speed/wps": 5516.121387475304, "speed/FLOPS": 243784331257667.0, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042391713708639145, "optim/lr": 2.5834440363164957e-05, "optim/total_tokens": 1943791468544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2949974536895752, "created_at": "2025-06-03T04:59:59.596846+00:00"} {"global_step": 231719, "acc_step": 0, "speed/wps": 5518.407860318082, "speed/FLOPS": 243885381654088.88, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 191.05, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04217194765806198, "optim/lr": 2.583089313807041e-05, "optim/total_tokens": 1943799857152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3000630140304565, "created_at": "2025-06-03T05:00:02.574554+00:00"} {"global_step": 231720, "acc_step": 0, "speed/wps": 5523.165320134423, "speed/FLOPS": 244095637027084.34, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.99 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.99, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04213576018810272, "optim/lr": 2.5827345912975864e-05, "optim/total_tokens": 1943808245760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2986761331558228, "created_at": "2025-06-03T05:00:05.545093+00:00"} {"global_step": 231721, "acc_step": 0, "speed/wps": 5519.007099415717, "speed/FLOPS": 243911864955020.56, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042160242795944214, "optim/lr": 2.5823798687881538e-05, "optim/total_tokens": 1943816634368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3100366592407227, "created_at": "2025-06-03T05:00:08.518119+00:00"} {"global_step": 231722, "acc_step": 0, "speed/wps": 5515.525630223433, "speed/FLOPS": 243758001836496.38, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041775815188884735, "optim/lr": 2.582025146278699e-05, "optim/total_tokens": 1943825022976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.279619574546814, "created_at": "2025-06-03T05:00:11.492432+00:00"} {"global_step": 231723, "acc_step": 0, "speed/wps": 5524.353931305768, "speed/FLOPS": 244148167556994.3, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.99 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.99, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041762351989746094, "optim/lr": 2.5816704237692445e-05, "optim/total_tokens": 1943833411584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3004562854766846, "created_at": "2025-06-03T05:00:14.462197+00:00"} {"global_step": 231724, "acc_step": 0, "speed/wps": 5530.05129717808, "speed/FLOPS": 244399961966788.38, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.99 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.99, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04204575717449188, "optim/lr": 2.58131570125979e-05, "optim/total_tokens": 1943841800192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.300632357597351, "created_at": "2025-06-03T05:00:17.428248+00:00"} {"global_step": 231725, "acc_step": 0, "speed/wps": 5527.295853347346, "speed/FLOPS": 244278185453109.97, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.99 hours", "speed/est_time_elapsed_hrs": 190.75, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.99, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04310039058327675, "optim/lr": 2.5809609787503576e-05, "optim/total_tokens": 1943850188800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2970949411392212, "created_at": "2025-06-03T05:00:20.396559+00:00"} {"global_step": 231726, "acc_step": 0, "speed/wps": 5530.3098296205135, "speed/FLOPS": 244411387777454.94, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042642220854759216, "optim/lr": 2.5806062562409026e-05, "optim/total_tokens": 1943858577408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2888985872268677, "created_at": "2025-06-03T05:00:23.368025+00:00"} {"global_step": 231727, "acc_step": 0, "speed/wps": 5504.0511626856405, "speed/FLOPS": 243250889102974.94, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "6.01 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 6.01, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04183446243405342, "optim/lr": 2.580251533731448e-05, "optim/total_tokens": 1943866966016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.281627893447876, "created_at": "2025-06-03T05:00:26.349158+00:00"} {"global_step": 231728, "acc_step": 0, "speed/wps": 5513.154204328426, "speed/FLOPS": 243653196949995.12, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "6.0 hours", "speed/est_time_elapsed_hrs": 191.25, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 6.0, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04238379746675491, "optim/lr": 2.5798968112219933e-05, "optim/total_tokens": 1943875354624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.284022569656372, "created_at": "2025-06-03T05:00:29.327279+00:00"} {"global_step": 231729, "acc_step": 0, "speed/wps": 5521.98736135503, "speed/FLOPS": 244043577278374.78, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.99 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.99, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04249099642038345, "optim/lr": 2.579542088712561e-05, "optim/total_tokens": 1943883743232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3021481037139893, "created_at": "2025-06-03T05:00:32.303065+00:00"} {"global_step": 231730, "acc_step": 0, "speed/wps": 5531.502360416796, "speed/FLOPS": 244464091534724.7, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04256832227110863, "optim/lr": 2.5791873662031064e-05, "optim/total_tokens": 1943892131840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3039872646331787, "created_at": "2025-06-03T05:00:35.269632+00:00"} {"global_step": 231731, "acc_step": 0, "speed/wps": 5536.86910277054, "speed/FLOPS": 244701274077282.62, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.42, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0423404760658741, "optim/lr": 2.5788326436936514e-05, "optim/total_tokens": 1943900520448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3158541917800903, "created_at": "2025-06-03T05:00:38.234068+00:00"} {"global_step": 231732, "acc_step": 0, "speed/wps": 5529.641296531813, "speed/FLOPS": 244381842036796.94, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04597633332014084, "optim/lr": 2.5784779211841968e-05, "optim/total_tokens": 1943908909056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3119370937347412, "created_at": "2025-06-03T05:00:41.203861+00:00"} {"global_step": 231733, "acc_step": 0, "speed/wps": 5535.224955506718, "speed/FLOPS": 244628611183730.28, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04197511449456215, "optim/lr": 2.5781231986747645e-05, "optim/total_tokens": 1943917297664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3099080324172974, "created_at": "2025-06-03T05:00:44.173393+00:00"} {"global_step": 231734, "acc_step": 0, "speed/wps": 5533.851414413781, "speed/FLOPS": 244567907697843.1, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04336829483509064, "optim/lr": 2.57776847616531e-05, "optim/total_tokens": 1943925686272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2888895273208618, "created_at": "2025-06-03T05:00:47.142091+00:00"} {"global_step": 231735, "acc_step": 0, "speed/wps": 5517.065952207366, "speed/FLOPS": 243826076184103.56, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.99 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.99, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04824550822377205, "optim/lr": 2.5774137536558552e-05, "optim/total_tokens": 1943934074880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2994015216827393, "created_at": "2025-06-03T05:00:50.116968+00:00"} {"global_step": 231736, "acc_step": 0, "speed/wps": 5522.618958773708, "speed/FLOPS": 244071490651471.7, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04300122708082199, "optim/lr": 2.5770590311464002e-05, "optim/total_tokens": 1943942463488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3095645904541016, "created_at": "2025-06-03T05:00:53.090262+00:00"} {"global_step": 231737, "acc_step": 0, "speed/wps": 5524.489095711668, "speed/FLOPS": 244154141131900.9, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042448244988918304, "optim/lr": 2.576704308636968e-05, "optim/total_tokens": 1943950852096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2979289293289185, "created_at": "2025-06-03T05:00:56.063604+00:00"} {"global_step": 231738, "acc_step": 0, "speed/wps": 5514.890822464041, "speed/FLOPS": 243729946582771.9, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.99 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.99, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043313078582286835, "optim/lr": 2.5763495861275133e-05, "optim/total_tokens": 1943959240704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2884958982467651, "created_at": "2025-06-03T05:00:59.039219+00:00"} {"global_step": 231739, "acc_step": 0, "speed/wps": 5531.760668059061, "speed/FLOPS": 244475507410374.4, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04349770396947861, "optim/lr": 2.5759948636180587e-05, "optim/total_tokens": 1943967629312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3004661798477173, "created_at": "2025-06-03T05:01:02.005631+00:00"} {"global_step": 231740, "acc_step": 0, "speed/wps": 5536.404182144035, "speed/FLOPS": 244680726965270.6, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05818453058600426, "optim/lr": 2.575640141108604e-05, "optim/total_tokens": 1943976017920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2967864274978638, "created_at": "2025-06-03T05:01:04.968756+00:00"} {"global_step": 231741, "acc_step": 0, "speed/wps": 5536.359448502588, "speed/FLOPS": 244678749967286.16, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.45, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04763277620077133, "optim/lr": 2.5752854185991714e-05, "optim/total_tokens": 1943984406528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3117785453796387, "created_at": "2025-06-03T05:01:07.931918+00:00"} {"global_step": 231742, "acc_step": 0, "speed/wps": 5538.344029085526, "speed/FLOPS": 244766458271047.75, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.39, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04832157865166664, "optim/lr": 2.5749306960897168e-05, "optim/total_tokens": 1943992795136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.3010179996490479, "created_at": "2025-06-03T05:01:10.894076+00:00"} {"global_step": 231743, "acc_step": 0, "speed/wps": 5531.970403433935, "speed/FLOPS": 244484776640420.88, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.048833996057510376, "optim/lr": 2.574575973580262e-05, "optim/total_tokens": 1944001183744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2968608140945435, "created_at": "2025-06-03T05:01:13.859421+00:00"} {"global_step": 231744, "acc_step": 0, "speed/wps": 5526.960946742803, "speed/FLOPS": 244263384295396.56, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043868158012628555, "optim/lr": 2.5742212510708295e-05, "optim/total_tokens": 1944009572352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2900663614273071, "created_at": "2025-06-03T05:01:16.830974+00:00"} {"global_step": 231745, "acc_step": 0, "speed/wps": 5534.815811620564, "speed/FLOPS": 244610529118150.53, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05368320271372795, "optim/lr": 2.573866528561375e-05, "optim/total_tokens": 1944017960960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3000856637954712, "created_at": "2025-06-03T05:01:19.794700+00:00"} {"global_step": 231746, "acc_step": 0, "speed/wps": 5523.154409214013, "speed/FLOPS": 244095154820249.38, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04147861897945404, "optim/lr": 2.5735118060519203e-05, "optim/total_tokens": 1944026349568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2889676094055176, "created_at": "2025-06-03T05:01:22.766738+00:00"} {"global_step": 231747, "acc_step": 0, "speed/wps": 5517.875426080407, "speed/FLOPS": 243861850786029.12, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05780327320098877, "optim/lr": 2.5731570835424656e-05, "optim/total_tokens": 1944034738176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.288114070892334, "created_at": "2025-06-03T05:01:25.739780+00:00"} {"global_step": 231748, "acc_step": 0, "speed/wps": 5524.539240560075, "speed/FLOPS": 244156357277535.94, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04194507747888565, "optim/lr": 2.572802361033033e-05, "optim/total_tokens": 1944043126784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2904385328292847, "created_at": "2025-06-03T05:01:28.709562+00:00"} {"global_step": 231749, "acc_step": 0, "speed/wps": 5524.405161424415, "speed/FLOPS": 244150431666019.0, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.056760676205158234, "optim/lr": 2.5724476385235784e-05, "optim/total_tokens": 1944051515392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3044580221176147, "created_at": "2025-06-03T05:01:31.679050+00:00"} {"global_step": 231750, "acc_step": 0, "speed/wps": 5530.251162659216, "speed/FLOPS": 244408794998050.3, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.6, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043252263218164444, "optim/lr": 2.5720929160141237e-05, "optim/total_tokens": 1944059904000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3019989728927612, "created_at": "2025-06-03T05:01:34.646372+00:00"} {"global_step": 231751, "acc_step": 0, "speed/wps": 5530.545837819357, "speed/FLOPS": 244421818131844.34, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05849580094218254, "optim/lr": 2.571738193504669e-05, "optim/total_tokens": 1944068292608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.298607349395752, "created_at": "2025-06-03T05:01:37.617386+00:00"} {"global_step": 231752, "acc_step": 0, "speed/wps": 5519.852626995686, "speed/FLOPS": 243949232946252.72, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04684506729245186, "optim/lr": 2.5713834709952365e-05, "optim/total_tokens": 1944076681216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2844958305358887, "created_at": "2025-06-03T05:01:40.592612+00:00"} {"global_step": 231753, "acc_step": 0, "speed/wps": 5533.2882466951305, "speed/FLOPS": 244543018567232.44, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.050543900579214096, "optim/lr": 2.5710287484857818e-05, "optim/total_tokens": 1944085069824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3047674894332886, "created_at": "2025-06-03T05:01:43.557466+00:00"} {"global_step": 231754, "acc_step": 0, "speed/wps": 5536.087439461649, "speed/FLOPS": 244666728559945.16, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 190.41, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04366559907793999, "optim/lr": 2.5706740259763272e-05, "optim/total_tokens": 1944093458432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2860652208328247, "created_at": "2025-06-03T05:01:46.525589+00:00"} {"global_step": 231755, "acc_step": 0, "speed/wps": 5513.970218799808, "speed/FLOPS": 243689260612889.53, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.047306980937719345, "optim/lr": 2.5703193034668725e-05, "optim/total_tokens": 1944101847040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2999844551086426, "created_at": "2025-06-03T05:01:49.504954+00:00"} {"global_step": 231756, "acc_step": 0, "speed/wps": 5514.245734457215, "speed/FLOPS": 243701436994729.94, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04120168462395668, "optim/lr": 2.5699645809574403e-05, "optim/total_tokens": 1944110235648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2956597805023193, "created_at": "2025-06-03T05:01:52.482191+00:00"} {"global_step": 231757, "acc_step": 0, "speed/wps": 5522.366481542474, "speed/FLOPS": 244060332450146.75, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.049524519592523575, "optim/lr": 2.5696098584479853e-05, "optim/total_tokens": 1944118624256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2967138290405273, "created_at": "2025-06-03T05:01:55.455773+00:00"} {"global_step": 231758, "acc_step": 0, "speed/wps": 5535.749831842305, "speed/FLOPS": 244651808031202.6, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 190.49, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04237568378448486, "optim/lr": 2.5692551359385307e-05, "optim/total_tokens": 1944127012864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3008612394332886, "created_at": "2025-06-03T05:01:58.424933+00:00"} {"global_step": 231759, "acc_step": 0, "speed/wps": 5522.489400885407, "speed/FLOPS": 244065764855946.2, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05036359652876854, "optim/lr": 2.568900413429076e-05, "optim/total_tokens": 1944135401472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2832902669906616, "created_at": "2025-06-03T05:02:01.399878+00:00"} {"global_step": 231760, "acc_step": 0, "speed/wps": 5532.751971142715, "speed/FLOPS": 244519317932722.78, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 190.53, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04209606349468231, "optim/lr": 2.5685456909196437e-05, "optim/total_tokens": 1944143790080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.273309588432312, "created_at": "2025-06-03T05:02:04.369293+00:00"} {"global_step": 231761, "acc_step": 0, "speed/wps": 5524.067339642587, "speed/FLOPS": 244135501672390.8, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05003722384572029, "optim/lr": 2.568190968410189e-05, "optim/total_tokens": 1944152178688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2960946559906006, "created_at": "2025-06-03T05:02:07.342112+00:00"} {"global_step": 231762, "acc_step": 0, "speed/wps": 5515.506517055751, "speed/FLOPS": 243757157132314.88, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04655929282307625, "optim/lr": 2.567836245900734e-05, "optim/total_tokens": 1944160567296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2939783334732056, "created_at": "2025-06-03T05:02:10.317394+00:00"} {"global_step": 231763, "acc_step": 0, "speed/wps": 5518.648786973566, "speed/FLOPS": 243896029379086.84, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044806674122810364, "optim/lr": 2.5674815233912795e-05, "optim/total_tokens": 1944168955904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2984157800674438, "created_at": "2025-06-03T05:02:13.292833+00:00"} {"global_step": 231764, "acc_step": 0, "speed/wps": 5523.923907962223, "speed/FLOPS": 244129162726268.62, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04370550811290741, "optim/lr": 2.5671268008818472e-05, "optim/total_tokens": 1944177344512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2945363521575928, "created_at": "2025-06-03T05:02:16.266362+00:00"} {"global_step": 231765, "acc_step": 0, "speed/wps": 5523.284737468408, "speed/FLOPS": 244100914662013.16, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04720316827297211, "optim/lr": 2.5667720783723926e-05, "optim/total_tokens": 1944185733120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2848199605941772, "created_at": "2025-06-03T05:02:19.236730+00:00"} {"global_step": 231766, "acc_step": 0, "speed/wps": 5519.024900188477, "speed/FLOPS": 243912651658063.97, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04415730759501457, "optim/lr": 2.566417355862938e-05, "optim/total_tokens": 1944194121728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.29989755153656, "created_at": "2025-06-03T05:02:22.212341+00:00"} {"global_step": 231767, "acc_step": 0, "speed/wps": 5533.557534805564, "speed/FLOPS": 244554919723372.1, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 190.52, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044070661067962646, "optim/lr": 2.566062633353483e-05, "optim/total_tokens": 1944202510336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2949507236480713, "created_at": "2025-06-03T05:02:25.180462+00:00"} {"global_step": 231768, "acc_step": 0, "speed/wps": 5517.105954310442, "speed/FLOPS": 243827844072310.22, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04684945568442345, "optim/lr": 2.5657079108440507e-05, "optim/total_tokens": 1944210898944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.294920563697815, "created_at": "2025-06-03T05:02:28.159013+00:00"} {"global_step": 231769, "acc_step": 0, "speed/wps": 5536.3942607769395, "speed/FLOPS": 244680288491627.12, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 190.48, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0421530082821846, "optim/lr": 2.565353188334596e-05, "optim/total_tokens": 1944219287552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2893675565719604, "created_at": "2025-06-03T05:02:31.124196+00:00"} {"global_step": 231770, "acc_step": 0, "speed/wps": 5534.282070399757, "speed/FLOPS": 244586940488126.06, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042758967727422714, "optim/lr": 2.5649984658251414e-05, "optim/total_tokens": 1944227676160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2954127788543701, "created_at": "2025-06-03T05:02:34.088436+00:00"} {"global_step": 231771, "acc_step": 0, "speed/wps": 5519.508672921341, "speed/FLOPS": 243934031936683.22, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042374417185783386, "optim/lr": 2.5646437433157088e-05, "optim/total_tokens": 1944236064768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2903940677642822, "created_at": "2025-06-03T05:02:37.060638+00:00"} {"global_step": 231772, "acc_step": 0, "speed/wps": 5501.851273403025, "speed/FLOPS": 243153665256737.4, "speed/curr_iter_time": 2.9772, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9772, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.98 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.98, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043042559176683426, "optim/lr": 2.564289020806254e-05, "optim/total_tokens": 1944244453376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 358, "loss/out": 1.308876872062683, "created_at": "2025-06-03T05:02:40.046784+00:00"} {"global_step": 231773, "acc_step": 0, "speed/wps": 5522.546866564951, "speed/FLOPS": 244068304544846.03, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04300370812416077, "optim/lr": 2.5639342982967995e-05, "optim/total_tokens": 1944252841984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3018982410430908, "created_at": "2025-06-03T05:02:43.023251+00:00"} {"global_step": 231774, "acc_step": 0, "speed/wps": 5526.6326088495, "speed/FLOPS": 244248873441098.28, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04167580232024193, "optim/lr": 2.563579575787345e-05, "optim/total_tokens": 1944261230592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2944340705871582, "created_at": "2025-06-03T05:02:45.992556+00:00"} {"global_step": 231775, "acc_step": 0, "speed/wps": 5534.512896968947, "speed/FLOPS": 244597141841006.78, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 190.54, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04510748013854027, "optim/lr": 2.5632248532779122e-05, "optim/total_tokens": 1944269619200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2906285524368286, "created_at": "2025-06-03T05:02:48.957081+00:00"} {"global_step": 231776, "acc_step": 0, "speed/wps": 5515.8757581119235, "speed/FLOPS": 243773475697050.66, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04284442588686943, "optim/lr": 2.5628701307684576e-05, "optim/total_tokens": 1944278007808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2935810089111328, "created_at": "2025-06-03T05:02:51.934857+00:00"} {"global_step": 231777, "acc_step": 0, "speed/wps": 5521.800557674709, "speed/FLOPS": 244035321511852.5, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04229341447353363, "optim/lr": 2.562515408259003e-05, "optim/total_tokens": 1944286396416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2995681762695312, "created_at": "2025-06-03T05:02:54.909733+00:00"} {"global_step": 231778, "acc_step": 0, "speed/wps": 5528.164521157442, "speed/FLOPS": 244316576124071.34, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 190.77, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.048068027943372726, "optim/lr": 2.5621606857495483e-05, "optim/total_tokens": 1944294785024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2958018779754639, "created_at": "2025-06-03T05:02:57.882215+00:00"} {"global_step": 231779, "acc_step": 0, "speed/wps": 5508.711752371778, "speed/FLOPS": 243456863312041.7, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.050795476883649826, "optim/lr": 2.5618059632401157e-05, "optim/total_tokens": 1944303173632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.301660418510437, "created_at": "2025-06-03T05:03:00.861136+00:00"} {"global_step": 231780, "acc_step": 0, "speed/wps": 5503.015090294604, "speed/FLOPS": 243205100006390.38, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.97 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.97, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.043807175010442734, "optim/lr": 2.561451240730661e-05, "optim/total_tokens": 1944311562240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2742559909820557, "created_at": "2025-06-03T05:03:03.846500+00:00"} {"global_step": 231781, "acc_step": 0, "speed/wps": 5532.29988564271, "speed/FLOPS": 244499338067605.94, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05153118446469307, "optim/lr": 2.5610965182212064e-05, "optim/total_tokens": 1944319950848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2985700368881226, "created_at": "2025-06-03T05:03:06.812174+00:00"} {"global_step": 231782, "acc_step": 0, "speed/wps": 5525.371695349638, "speed/FLOPS": 244193147518344.72, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04328565672039986, "optim/lr": 2.5607417957117518e-05, "optim/total_tokens": 1944328339456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3071709871292114, "created_at": "2025-06-03T05:03:09.781278+00:00"} {"global_step": 231783, "acc_step": 0, "speed/wps": 5514.101500106176, "speed/FLOPS": 243695062574672.34, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.049294613301754, "optim/lr": 2.5603870732023195e-05, "optim/total_tokens": 1944336728064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.285126805305481, "created_at": "2025-06-03T05:03:12.757087+00:00"} {"global_step": 231784, "acc_step": 0, "speed/wps": 5515.9724138294405, "speed/FLOPS": 243777747385036.1, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04207436740398407, "optim/lr": 2.5600323506928645e-05, "optim/total_tokens": 1944345116672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3052109479904175, "created_at": "2025-06-03T05:03:15.730847+00:00"} {"global_step": 231785, "acc_step": 0, "speed/wps": 5532.75743622105, "speed/FLOPS": 244519559461212.38, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 190.61, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04777725040912628, "optim/lr": 2.55967762818341e-05, "optim/total_tokens": 1944353505280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2851033210754395, "created_at": "2025-06-03T05:03:18.695826+00:00"} {"global_step": 231786, "acc_step": 0, "speed/wps": 5520.972750808011, "speed/FLOPS": 243998736685444.12, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042502276599407196, "optim/lr": 2.5593229056739552e-05, "optim/total_tokens": 1944361893888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2936323881149292, "created_at": "2025-06-03T05:03:21.668784+00:00"} {"global_step": 231787, "acc_step": 0, "speed/wps": 5512.052895858721, "speed/FLOPS": 243604524752641.94, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 191.27, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05341094359755516, "optim/lr": 2.558968183164523e-05, "optim/total_tokens": 1944370282496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2964693307876587, "created_at": "2025-06-03T05:03:24.645452+00:00"} {"global_step": 231788, "acc_step": 0, "speed/wps": 5523.381483939406, "speed/FLOPS": 244105190360837.94, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04251904785633087, "optim/lr": 2.5586134606550683e-05, "optim/total_tokens": 1944378671104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2883968353271484, "created_at": "2025-06-03T05:03:27.618166+00:00"} {"global_step": 231789, "acc_step": 0, "speed/wps": 5521.544841312933, "speed/FLOPS": 244024020157537.0, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.050092488527297974, "optim/lr": 2.5582587381456134e-05, "optim/total_tokens": 1944387059712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2926839590072632, "created_at": "2025-06-03T05:03:30.591176+00:00"} {"global_step": 231790, "acc_step": 0, "speed/wps": 5507.849505766639, "speed/FLOPS": 243418756425472.75, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.96 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.96, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04360656812787056, "optim/lr": 2.5579040156361587e-05, "optim/total_tokens": 1944395448320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.288064956665039, "created_at": "2025-06-03T05:03:33.569942+00:00"} {"global_step": 231791, "acc_step": 0, "speed/wps": 5520.036526295359, "speed/FLOPS": 243957360354016.34, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.052350301295518875, "optim/lr": 2.5575492931267264e-05, "optim/total_tokens": 1944403836928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.293298602104187, "created_at": "2025-06-03T05:03:36.542126+00:00"} {"global_step": 231792, "acc_step": 0, "speed/wps": 5510.963051474613, "speed/FLOPS": 243556359209193.6, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04127391427755356, "optim/lr": 2.5571945706172718e-05, "optim/total_tokens": 1944412225536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2783513069152832, "created_at": "2025-06-03T05:03:39.518893+00:00"} {"global_step": 231793, "acc_step": 0, "speed/wps": 5519.651626452841, "speed/FLOPS": 243940349751073.03, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.047812335193157196, "optim/lr": 2.556839848107817e-05, "optim/total_tokens": 1944420614144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2821238040924072, "created_at": "2025-06-03T05:03:42.494788+00:00"} {"global_step": 231794, "acc_step": 0, "speed/wps": 5515.641446004617, "speed/FLOPS": 243763120301225.78, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041075535118579865, "optim/lr": 2.5564851255983622e-05, "optim/total_tokens": 1944429002752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2803086042404175, "created_at": "2025-06-03T05:03:45.473401+00:00"} {"global_step": 231795, "acc_step": 0, "speed/wps": 5517.511008330817, "speed/FLOPS": 243845745386756.38, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.048051197081804276, "optim/lr": 2.55613040308893e-05, "optim/total_tokens": 1944437391360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.287054181098938, "created_at": "2025-06-03T05:03:48.447293+00:00"} {"global_step": 231796, "acc_step": 0, "speed/wps": 5515.742162284429, "speed/FLOPS": 243767571445280.8, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0425761453807354, "optim/lr": 2.5557756805794753e-05, "optim/total_tokens": 1944445779968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2996548414230347, "created_at": "2025-06-03T05:03:51.421762+00:00"} {"global_step": 231797, "acc_step": 0, "speed/wps": 5504.987931649403, "speed/FLOPS": 243292289496355.06, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.95 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.95, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04382743686437607, "optim/lr": 2.5554209580700206e-05, "optim/total_tokens": 1944454168576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.301118016242981, "created_at": "2025-06-03T05:03:54.403504+00:00"} {"global_step": 231798, "acc_step": 0, "speed/wps": 5525.631560274609, "speed/FLOPS": 244204632217919.2, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04243358597159386, "optim/lr": 2.555066235560566e-05, "optim/total_tokens": 1944462557184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2851033210754395, "created_at": "2025-06-03T05:03:57.372668+00:00"} {"global_step": 231799, "acc_step": 0, "speed/wps": 5531.606424491444, "speed/FLOPS": 244468690634175.9, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05201498419046402, "optim/lr": 2.5547115130511334e-05, "optim/total_tokens": 1944470945792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2905703783035278, "created_at": "2025-06-03T05:04:00.338834+00:00"} {"global_step": 231800, "acc_step": 0, "speed/wps": 5536.009575939057, "speed/FLOPS": 244663287390788.22, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.51, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04347561299800873, "optim/lr": 2.5543567905416787e-05, "optim/total_tokens": 1944479334400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3012863397598267, "created_at": "2025-06-03T05:04:03.302052+00:00"} {"global_step": 231801, "acc_step": 0, "speed/wps": 5527.849039711871, "speed/FLOPS": 244302633458957.5, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.045784302055835724, "optim/lr": 2.554002068032224e-05, "optim/total_tokens": 1944487723008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2873821258544922, "created_at": "2025-06-03T05:04:06.274330+00:00"} {"global_step": 231802, "acc_step": 0, "speed/wps": 5526.392117818427, "speed/FLOPS": 244238244968469.56, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041645877063274384, "optim/lr": 2.5536473455227915e-05, "optim/total_tokens": 1944496111616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3114545345306396, "created_at": "2025-06-03T05:04:09.242859+00:00"} {"global_step": 231803, "acc_step": 0, "speed/wps": 5523.268919887128, "speed/FLOPS": 244100215605882.28, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04910021275281906, "optim/lr": 2.553292623013337e-05, "optim/total_tokens": 1944504500224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2998666763305664, "created_at": "2025-06-03T05:04:12.215803+00:00"} {"global_step": 231804, "acc_step": 0, "speed/wps": 5518.136370446041, "speed/FLOPS": 243873383191355.78, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04323740676045418, "optim/lr": 2.5529379005038822e-05, "optim/total_tokens": 1944512888832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.284891128540039, "created_at": "2025-06-03T05:04:15.190003+00:00"} {"global_step": 231805, "acc_step": 0, "speed/wps": 5522.425993736351, "speed/FLOPS": 244062962584505.12, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04431081563234329, "optim/lr": 2.5525831779944276e-05, "optim/total_tokens": 1944521277440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2789061069488525, "created_at": "2025-06-03T05:04:18.161156+00:00"} {"global_step": 231806, "acc_step": 0, "speed/wps": 5520.815080927233, "speed/FLOPS": 243991768483741.3, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042765699326992035, "optim/lr": 2.552228455484995e-05, "optim/total_tokens": 1944529666048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2910220623016357, "created_at": "2025-06-03T05:04:21.132813+00:00"} {"global_step": 231807, "acc_step": 0, "speed/wps": 5527.2093313553, "speed/FLOPS": 244274361623921.25, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.82, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044474419206380844, "optim/lr": 2.5518737329755403e-05, "optim/total_tokens": 1944538054656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2899799346923828, "created_at": "2025-06-03T05:04:24.101432+00:00"} {"global_step": 231808, "acc_step": 0, "speed/wps": 5538.726773220012, "speed/FLOPS": 244783373602729.94, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 190.36, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04304831475019455, "optim/lr": 2.5515190104660857e-05, "optim/total_tokens": 1944546443264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2880175113677979, "created_at": "2025-06-03T05:04:27.063276+00:00"} {"global_step": 231809, "acc_step": 0, "speed/wps": 5524.559102102955, "speed/FLOPS": 244157235056070.62, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04373277351260185, "optim/lr": 2.551164287956631e-05, "optim/total_tokens": 1944554831872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2781680822372437, "created_at": "2025-06-03T05:04:30.036295+00:00"} {"global_step": 231810, "acc_step": 0, "speed/wps": 5522.1514285432895, "speed/FLOPS": 244050828208323.84, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04241861030459404, "optim/lr": 2.5508095654471984e-05, "optim/total_tokens": 1944563220480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3035168647766113, "created_at": "2025-06-03T05:04:33.007471+00:00"} {"global_step": 231811, "acc_step": 0, "speed/wps": 5521.1060547583875, "speed/FLOPS": 244004628037739.25, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04499975964426994, "optim/lr": 2.5504548429377438e-05, "optim/total_tokens": 1944571609088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2973922491073608, "created_at": "2025-06-03T05:04:35.980019+00:00"} {"global_step": 231812, "acc_step": 0, "speed/wps": 5526.7590592289525, "speed/FLOPS": 244254461900638.38, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042970117181539536, "optim/lr": 2.550100120428289e-05, "optim/total_tokens": 1944579997696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.3019944429397583, "created_at": "2025-06-03T05:04:38.948014+00:00"} {"global_step": 231813, "acc_step": 0, "speed/wps": 5505.806096648145, "speed/FLOPS": 243328448201551.34, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044700298458337784, "optim/lr": 2.5497453979188345e-05, "optim/total_tokens": 1944588386304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2977180480957031, "created_at": "2025-06-03T05:04:41.927556+00:00"} {"global_step": 231814, "acc_step": 0, "speed/wps": 5507.265491571626, "speed/FLOPS": 243392945987308.8, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.94 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.94, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042160045355558395, "optim/lr": 2.5493906754094022e-05, "optim/total_tokens": 1944596774912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2872765064239502, "created_at": "2025-06-03T05:04:44.906420+00:00"} {"global_step": 231815, "acc_step": 0, "speed/wps": 5513.4916870532825, "speed/FLOPS": 243668111959040.6, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.047301508486270905, "optim/lr": 2.5490359528999472e-05, "optim/total_tokens": 1944605163520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2967731952667236, "created_at": "2025-06-03T05:04:47.883065+00:00"} {"global_step": 231816, "acc_step": 0, "speed/wps": 5523.3392681970945, "speed/FLOPS": 244103324641107.53, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0419599674642086, "optim/lr": 2.5486812303904926e-05, "optim/total_tokens": 1944613552128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2956963777542114, "created_at": "2025-06-03T05:04:50.858923+00:00"} {"global_step": 231817, "acc_step": 0, "speed/wps": 5527.830666963375, "speed/FLOPS": 244301821477514.22, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04662882536649704, "optim/lr": 2.548326507881038e-05, "optim/total_tokens": 1944621940736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2964558601379395, "created_at": "2025-06-03T05:04:53.826772+00:00"} {"global_step": 231818, "acc_step": 0, "speed/wps": 5518.789351809519, "speed/FLOPS": 243902241625359.9, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04835048317909241, "optim/lr": 2.5479717853716057e-05, "optim/total_tokens": 1944630329344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2881882190704346, "created_at": "2025-06-03T05:04:56.799836+00:00"} {"global_step": 231819, "acc_step": 0, "speed/wps": 5516.957379477411, "speed/FLOPS": 243821277825165.2, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04368222877383232, "optim/lr": 2.547617062862151e-05, "optim/total_tokens": 1944638717952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2967078685760498, "created_at": "2025-06-03T05:04:59.773411+00:00"} {"global_step": 231820, "acc_step": 0, "speed/wps": 5523.73188888531, "speed/FLOPS": 244120676465911.78, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.055385932326316833, "optim/lr": 2.547262340352696e-05, "optim/total_tokens": 1944647106560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2877079248428345, "created_at": "2025-06-03T05:05:02.744602+00:00"} {"global_step": 231821, "acc_step": 0, "speed/wps": 5524.087967091069, "speed/FLOPS": 244136413300032.88, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04337124153971672, "optim/lr": 2.5469076178432414e-05, "optim/total_tokens": 1944655495168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2968370914459229, "created_at": "2025-06-03T05:05:05.716366+00:00"} {"global_step": 231822, "acc_step": 0, "speed/wps": 5509.4048744464, "speed/FLOPS": 243487495760019.6, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.93 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.93, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05231449007987976, "optim/lr": 2.546552895333809e-05, "optim/total_tokens": 1944663883776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2908393144607544, "created_at": "2025-06-03T05:05:08.694780+00:00"} {"global_step": 231823, "acc_step": 0, "speed/wps": 5521.694457533351, "speed/FLOPS": 244030632428674.22, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04381849616765976, "optim/lr": 2.5461981728243545e-05, "optim/total_tokens": 1944672272384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2960164546966553, "created_at": "2025-06-03T05:05:11.668003+00:00"} {"global_step": 231824, "acc_step": 0, "speed/wps": 5533.026147553655, "speed/FLOPS": 244531435126724.25, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 190.58, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05511720851063728, "optim/lr": 2.5458434503149e-05, "optim/total_tokens": 1944680660992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2767417430877686, "created_at": "2025-06-03T05:05:14.632682+00:00"} {"global_step": 231825, "acc_step": 0, "speed/wps": 5523.778431484284, "speed/FLOPS": 244122733410559.8, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042647164314985275, "optim/lr": 2.5454887278054452e-05, "optim/total_tokens": 1944689049600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2927576303482056, "created_at": "2025-06-03T05:05:17.604422+00:00"} {"global_step": 231826, "acc_step": 0, "speed/wps": 5530.235613730529, "speed/FLOPS": 244408107814988.97, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 190.73, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05152612552046776, "optim/lr": 2.5451340052960126e-05, "optim/total_tokens": 1944697438208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.284382700920105, "created_at": "2025-06-03T05:05:20.574971+00:00"} {"global_step": 231827, "acc_step": 0, "speed/wps": 5523.853057375514, "speed/FLOPS": 244126031492982.25, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042807869613170624, "optim/lr": 2.544779282786558e-05, "optim/total_tokens": 1944705826816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.3046122789382935, "created_at": "2025-06-03T05:05:23.545247+00:00"} {"global_step": 231828, "acc_step": 0, "speed/wps": 5516.364709159285, "speed/FLOPS": 243795084830665.7, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04640832170844078, "optim/lr": 2.5444245602771033e-05, "optim/total_tokens": 1944714215424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2940289974212646, "created_at": "2025-06-03T05:05:26.521923+00:00"} {"global_step": 231829, "acc_step": 0, "speed/wps": 5516.324351532748, "speed/FLOPS": 243793301230141.8, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.22, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04258131980895996, "optim/lr": 2.5440698377676707e-05, "optim/total_tokens": 1944722604032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.275377869606018, "created_at": "2025-06-03T05:05:29.496594+00:00"} {"global_step": 231830, "acc_step": 0, "speed/wps": 5509.401187270979, "speed/FLOPS": 243487332805738.66, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04539664462208748, "optim/lr": 2.543715115258216e-05, "optim/total_tokens": 1944730992640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2903250455856323, "created_at": "2025-06-03T05:05:32.475886+00:00"} {"global_step": 231831, "acc_step": 0, "speed/wps": 5522.832002282214, "speed/FLOPS": 244080906084092.12, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 190.93, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04321993887424469, "optim/lr": 2.5433603927487614e-05, "optim/total_tokens": 1944739381248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2876752614974976, "created_at": "2025-06-03T05:05:35.447922+00:00"} {"global_step": 231832, "acc_step": 0, "speed/wps": 5519.851202467814, "speed/FLOPS": 243949169989412.2, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04253728687763214, "optim/lr": 2.5430056702393068e-05, "optim/total_tokens": 1944747769856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2882884740829468, "created_at": "2025-06-03T05:05:38.422307+00:00"} {"global_step": 231833, "acc_step": 0, "speed/wps": 5519.71258426828, "speed/FLOPS": 243943043774505.06, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042448364198207855, "optim/lr": 2.5426509477298742e-05, "optim/total_tokens": 1944756158464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2899000644683838, "created_at": "2025-06-03T05:05:41.401353+00:00"} {"global_step": 231834, "acc_step": 0, "speed/wps": 5529.058294547229, "speed/FLOPS": 244356076333152.97, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04305517300963402, "optim/lr": 2.5422962252204195e-05, "optim/total_tokens": 1944764547072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.3028743267059326, "created_at": "2025-06-03T05:05:44.373697+00:00"} {"global_step": 231835, "acc_step": 0, "speed/wps": 5519.943424628489, "speed/FLOPS": 243953245736878.22, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04286166653037071, "optim/lr": 2.541941502710965e-05, "optim/total_tokens": 1944772935680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2848485708236694, "created_at": "2025-06-03T05:05:47.351719+00:00"} {"global_step": 231836, "acc_step": 0, "speed/wps": 5505.341952620681, "speed/FLOPS": 243307935411241.9, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.92 hours", "speed/est_time_elapsed_hrs": 191.61, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.92, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04176514968276024, "optim/lr": 2.5415867802015103e-05, "optim/total_tokens": 1944781324288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2971049547195435, "created_at": "2025-06-03T05:05:50.336244+00:00"} {"global_step": 231837, "acc_step": 0, "speed/wps": 5515.943982477011, "speed/FLOPS": 243776490864783.53, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04365869238972664, "optim/lr": 2.5412320576920776e-05, "optim/total_tokens": 1944789712896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3039348125457764, "created_at": "2025-06-03T05:05:53.310009+00:00"} {"global_step": 231838, "acc_step": 0, "speed/wps": 5514.823065855427, "speed/FLOPS": 243726952087480.9, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04175642877817154, "optim/lr": 2.540877335182623e-05, "optim/total_tokens": 1944798101504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.310534954071045, "created_at": "2025-06-03T05:05:56.284819+00:00"} {"global_step": 231839, "acc_step": 0, "speed/wps": 5524.450912574547, "speed/FLOPS": 244152453632679.22, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04254517704248428, "optim/lr": 2.5405226126731684e-05, "optim/total_tokens": 1944806490112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2813862562179565, "created_at": "2025-06-03T05:05:59.257782+00:00"} {"global_step": 231840, "acc_step": 0, "speed/wps": 5519.665238615934, "speed/FLOPS": 243940951339008.38, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04271313175559044, "optim/lr": 2.5401678901637137e-05, "optim/total_tokens": 1944814878720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2899278402328491, "created_at": "2025-06-03T05:06:02.230728+00:00"} {"global_step": 231841, "acc_step": 0, "speed/wps": 5527.554283219531, "speed/FLOPS": 244289606730696.56, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.041507065296173096, "optim/lr": 2.5398131676542814e-05, "optim/total_tokens": 1944823267328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.291812777519226, "created_at": "2025-06-03T05:06:05.200603+00:00"} {"global_step": 231842, "acc_step": 0, "speed/wps": 5525.73083622949, "speed/FLOPS": 244209019706984.53, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04176335409283638, "optim/lr": 2.5394584451448265e-05, "optim/total_tokens": 1944831655936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2983235120773315, "created_at": "2025-06-03T05:06:08.170008+00:00"} {"global_step": 231843, "acc_step": 0, "speed/wps": 5526.662177906778, "speed/FLOPS": 244250180242081.8, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04413583129644394, "optim/lr": 2.5391037226353718e-05, "optim/total_tokens": 1944840044544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3057328462600708, "created_at": "2025-06-03T05:06:11.139477+00:00"} {"global_step": 231844, "acc_step": 0, "speed/wps": 5519.296429015444, "speed/FLOPS": 243924651842405.38, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04222811758518219, "optim/lr": 2.5387490001259172e-05, "optim/total_tokens": 1944848433152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2815594673156738, "created_at": "2025-06-03T05:06:14.111700+00:00"} {"global_step": 231845, "acc_step": 0, "speed/wps": 5516.576712938739, "speed/FLOPS": 243804454312583.84, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04267125576734543, "optim/lr": 2.538394277616485e-05, "optim/total_tokens": 1944856821760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3014999628067017, "created_at": "2025-06-03T05:06:17.085580+00:00"} {"global_step": 231846, "acc_step": 0, "speed/wps": 5508.433413577992, "speed/FLOPS": 243444562162023.44, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04314475506544113, "optim/lr": 2.5380395551070303e-05, "optim/total_tokens": 1944865210368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2924933433532715, "created_at": "2025-06-03T05:06:20.067057+00:00"} {"global_step": 231847, "acc_step": 0, "speed/wps": 5504.517682062499, "speed/FLOPS": 243271506871569.47, "speed/curr_iter_time": 2.9757, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9757, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0419192910194397, "optim/lr": 2.5376848325975753e-05, "optim/total_tokens": 1944873598976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.30907142162323, "created_at": "2025-06-03T05:06:23.050861+00:00"} {"global_step": 231848, "acc_step": 0, "speed/wps": 5519.945299525844, "speed/FLOPS": 243953328597744.72, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044106706976890564, "optim/lr": 2.5373301100881206e-05, "optim/total_tokens": 1944881987584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.297694206237793, "created_at": "2025-06-03T05:06:26.022625+00:00"} {"global_step": 231849, "acc_step": 0, "speed/wps": 5517.950968222032, "speed/FLOPS": 243865189362029.22, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0427325963973999, "optim/lr": 2.5369753875786884e-05, "optim/total_tokens": 1944890376192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2995587587356567, "created_at": "2025-06-03T05:06:29.000941+00:00"} {"global_step": 231850, "acc_step": 0, "speed/wps": 5520.351596441984, "speed/FLOPS": 243971284841821.97, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04786102473735809, "optim/lr": 2.5366206650692337e-05, "optim/total_tokens": 1944898764800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2900296449661255, "created_at": "2025-06-03T05:06:31.976471+00:00"} {"global_step": 231851, "acc_step": 0, "speed/wps": 5515.325756495703, "speed/FLOPS": 243749168440777.2, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0021, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042182281613349915, "optim/lr": 2.536265942559779e-05, "optim/total_tokens": 1944907153408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.289908766746521, "created_at": "2025-06-03T05:06:34.950774+00:00"} {"global_step": 231852, "acc_step": 0, "speed/wps": 5520.725615925887, "speed/FLOPS": 243987814588605.2, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.06007181480526924, "optim/lr": 2.535911220050324e-05, "optim/total_tokens": 1944915542016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2964097261428833, "created_at": "2025-06-03T05:06:37.923599+00:00"} {"global_step": 231853, "acc_step": 0, "speed/wps": 5515.722768756922, "speed/FLOPS": 243766714350630.1, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04571708291769028, "optim/lr": 2.535556497540892e-05, "optim/total_tokens": 1944923930624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2932072877883911, "created_at": "2025-06-03T05:06:40.900809+00:00"} {"global_step": 231854, "acc_step": 0, "speed/wps": 5513.242898849678, "speed/FLOPS": 243657116793854.75, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.05196944624185562, "optim/lr": 2.5352017750314372e-05, "optim/total_tokens": 1944932319232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2848374843597412, "created_at": "2025-06-03T05:06:43.876412+00:00"} {"global_step": 231855, "acc_step": 0, "speed/wps": 5519.15518383643, "speed/FLOPS": 243918409528451.34, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.05, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04470903426408768, "optim/lr": 2.5348470525219826e-05, "optim/total_tokens": 1944940707840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2850970029830933, "created_at": "2025-06-03T05:06:46.851261+00:00"} {"global_step": 231856, "acc_step": 0, "speed/wps": 5510.1997946537485, "speed/FLOPS": 243522627164413.94, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04553929716348648, "optim/lr": 2.53449233001255e-05, "optim/total_tokens": 1944949096448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3031487464904785, "created_at": "2025-06-03T05:06:49.829956+00:00"} {"global_step": 231857, "acc_step": 0, "speed/wps": 5511.980441543317, "speed/FLOPS": 243601322642755.88, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04334954544901848, "optim/lr": 2.5341376075030953e-05, "optim/total_tokens": 1944957485056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3022404909133911, "created_at": "2025-06-03T05:06:52.809848+00:00"} {"global_step": 231858, "acc_step": 0, "speed/wps": 5493.417665009578, "speed/FLOPS": 242780942932868.03, "speed/curr_iter_time": 2.9797, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9797, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.91 hours", "speed/est_time_elapsed_hrs": 191.91, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.91, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04202478379011154, "optim/lr": 2.5337828849936407e-05, "optim/total_tokens": 1944965873664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2920293807983398, "created_at": "2025-06-03T05:06:55.795558+00:00"} {"global_step": 231859, "acc_step": 0, "speed/wps": 5513.790998901248, "speed/FLOPS": 243681340010703.75, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04324563965201378, "optim/lr": 2.533428162484186e-05, "optim/total_tokens": 1944974262272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3031936883926392, "created_at": "2025-06-03T05:06:58.771424+00:00"} {"global_step": 231860, "acc_step": 0, "speed/wps": 5506.275149309715, "speed/FLOPS": 243349177928363.56, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04411663860082626, "optim/lr": 2.5330734399747534e-05, "optim/total_tokens": 1944982650880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2938404083251953, "created_at": "2025-06-03T05:07:01.755249+00:00"} {"global_step": 231861, "acc_step": 0, "speed/wps": 5507.941397599203, "speed/FLOPS": 243422817574127.06, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.044194694608449936, "optim/lr": 2.5327187174652988e-05, "optim/total_tokens": 1944991039488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2881768941879272, "created_at": "2025-06-03T05:07:04.736959+00:00"} {"global_step": 231862, "acc_step": 0, "speed/wps": 5506.787543196771, "speed/FLOPS": 243371823115501.78, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.046452298760414124, "optim/lr": 2.532363994955844e-05, "optim/total_tokens": 1944999428096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2772977352142334, "created_at": "2025-06-03T05:07:07.716156+00:00"} {"global_step": 231863, "acc_step": 0, "speed/wps": 5505.111691880257, "speed/FLOPS": 243297759065096.5, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0449492372572422, "optim/lr": 2.5320092724463895e-05, "optim/total_tokens": 1945007816704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2848268747329712, "created_at": "2025-06-03T05:07:10.696230+00:00"} {"global_step": 231864, "acc_step": 0, "speed/wps": 5505.37746132704, "speed/FLOPS": 243309504714312.94, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04320606589317322, "optim/lr": 2.531654549936957e-05, "optim/total_tokens": 1945016205312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2861675024032593, "created_at": "2025-06-03T05:07:13.679647+00:00"} {"global_step": 231865, "acc_step": 0, "speed/wps": 5511.897995191142, "speed/FLOPS": 243597678935988.44, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04367196559906006, "optim/lr": 2.5312998274275022e-05, "optim/total_tokens": 1945024593920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2877552509307861, "created_at": "2025-06-03T05:07:16.658847+00:00"} {"global_step": 231866, "acc_step": 0, "speed/wps": 5509.899623577517, "speed/FLOPS": 243509361139259.34, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04252259060740471, "optim/lr": 2.5309451049180476e-05, "optim/total_tokens": 1945032982528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3113703727722168, "created_at": "2025-06-03T05:07:19.636187+00:00"} {"global_step": 231867, "acc_step": 0, "speed/wps": 5521.178195560493, "speed/FLOPS": 244007816291942.22, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04534442722797394, "optim/lr": 2.530590382408593e-05, "optim/total_tokens": 1945041371136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3105149269104004, "created_at": "2025-06-03T05:07:22.610884+00:00"} {"global_step": 231868, "acc_step": 0, "speed/wps": 5507.373383165586, "speed/FLOPS": 243397714243522.62, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.042712122201919556, "optim/lr": 2.5302356598991603e-05, "optim/total_tokens": 1945049759744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2974873781204224, "created_at": "2025-06-03T05:07:25.590494+00:00"} {"global_step": 231869, "acc_step": 0, "speed/wps": 5510.224475091929, "speed/FLOPS": 243523717913455.6, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.047629598528146744, "optim/lr": 2.5298809373897057e-05, "optim/total_tokens": 1945058148352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2931705713272095, "created_at": "2025-06-03T05:07:28.567452+00:00"} {"global_step": 231870, "acc_step": 0, "speed/wps": 5511.369760241318, "speed/FLOPS": 243574333654957.75, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.0430101715028286, "optim/lr": 2.529526214880251e-05, "optim/total_tokens": 1945066536960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3078734874725342, "created_at": "2025-06-03T05:07:31.543762+00:00"} {"global_step": 231871, "acc_step": 0, "speed/wps": 5517.376619491882, "speed/FLOPS": 243839806087939.88, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04871821030974388, "optim/lr": 2.5291714923707964e-05, "optim/total_tokens": 1945074925568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3192806243896484, "created_at": "2025-06-03T05:07:34.521495+00:00"} {"global_step": 231872, "acc_step": 0, "speed/wps": 5503.865418152883, "speed/FLOPS": 243242680145353.75, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04211577773094177, "optim/lr": 2.528816769861364e-05, "optim/total_tokens": 1945083314176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2854852676391602, "created_at": "2025-06-03T05:07:37.501814+00:00"} {"global_step": 231873, "acc_step": 0, "speed/wps": 5508.707475755626, "speed/FLOPS": 243456674307497.47, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04884251207113266, "optim/lr": 2.528462047351909e-05, "optim/total_tokens": 1945091702784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2870135307312012, "created_at": "2025-06-03T05:07:40.479616+00:00"} {"global_step": 231874, "acc_step": 0, "speed/wps": 5503.5569394101185, "speed/FLOPS": 243229046963860.9, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.89 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.89, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04155677184462547, "optim/lr": 2.5281073248424545e-05, "optim/total_tokens": 1945100091392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2841651439666748, "created_at": "2025-06-03T05:07:43.461182+00:00"} {"global_step": 231875, "acc_step": 0, "speed/wps": 5528.8190102326735, "speed/FLOPS": 244345501191217.78, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05376981571316719, "optim/lr": 2.527752602333e-05, "optim/total_tokens": 1945108480000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.305119276046753, "created_at": "2025-06-03T05:07:46.431761+00:00"} {"global_step": 231876, "acc_step": 0, "speed/wps": 5496.3799430341005, "speed/FLOPS": 242911860459238.5, "speed/curr_iter_time": 2.9802, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9802, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.9 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.9, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04312862083315849, "optim/lr": 2.5273978798235676e-05, "optim/total_tokens": 1945116868608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2867118120193481, "created_at": "2025-06-03T05:07:49.419673+00:00"} {"global_step": 231877, "acc_step": 0, "speed/wps": 5509.718109561479, "speed/FLOPS": 243501339148823.4, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.054160770028829575, "optim/lr": 2.527043157314113e-05, "optim/total_tokens": 1945125257216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2954463958740234, "created_at": "2025-06-03T05:07:52.399763+00:00"} {"global_step": 231878, "acc_step": 0, "speed/wps": 5519.29638788994, "speed/FLOPS": 243924650024868.6, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.87 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.87, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04484254866838455, "optim/lr": 2.526688434804658e-05, "optim/total_tokens": 1945133645824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2868613004684448, "created_at": "2025-06-03T05:07:55.372005+00:00"} {"global_step": 231879, "acc_step": 0, "speed/wps": 5525.138897152119, "speed/FLOPS": 244182859029583.6, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04965142533183098, "optim/lr": 2.5263337122952033e-05, "optim/total_tokens": 1945142034432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2833366394042969, "created_at": "2025-06-03T05:07:58.342117+00:00"} {"global_step": 231880, "acc_step": 0, "speed/wps": 5509.765375747963, "speed/FLOPS": 243503428072335.75, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04552149772644043, "optim/lr": 2.525978989785771e-05, "optim/total_tokens": 1945150423040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3057254552841187, "created_at": "2025-06-03T05:08:01.322293+00:00"} {"global_step": 231881, "acc_step": 0, "speed/wps": 5504.96952924601, "speed/FLOPS": 243291476204317.1, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.66, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04497188329696655, "optim/lr": 2.5256242672763164e-05, "optim/total_tokens": 1945158811648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3085780143737793, "created_at": "2025-06-03T05:08:04.305486+00:00"} {"global_step": 231882, "acc_step": 0, "speed/wps": 5502.436745026739, "speed/FLOPS": 243179540105790.2, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.25, "optim/grad_norm": 0.04374377056956291, "optim/lr": 2.5252695447668618e-05, "optim/total_tokens": 1945167200256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.286082148551941, "created_at": "2025-06-03T05:08:07.290688+00:00"} {"global_step": 231883, "acc_step": 0, "speed/wps": 5522.168633813582, "speed/FLOPS": 244051588593206.25, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04273180663585663, "optim/lr": 2.5249148222574292e-05, "optim/total_tokens": 1945175588864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2815812826156616, "created_at": "2025-06-03T05:08:10.262840+00:00"} {"global_step": 231884, "acc_step": 0, "speed/wps": 5525.540008771105, "speed/FLOPS": 244200586110067.38, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04282716289162636, "optim/lr": 2.5245600997479745e-05, "optim/total_tokens": 1945183977472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3027244806289673, "created_at": "2025-06-03T05:08:13.235179+00:00"} {"global_step": 231885, "acc_step": 0, "speed/wps": 5508.277281326528, "speed/FLOPS": 243437661915666.06, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045370280742645264, "optim/lr": 2.52420537723852e-05, "optim/total_tokens": 1945192366080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2975600957870483, "created_at": "2025-06-03T05:08:16.216973+00:00"} {"global_step": 231886, "acc_step": 0, "speed/wps": 5510.9539720507855, "speed/FLOPS": 243555957945133.12, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.87 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.87, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045341577380895615, "optim/lr": 2.5238506547290653e-05, "optim/total_tokens": 1945200754688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3056552410125732, "created_at": "2025-06-03T05:08:19.193800+00:00"} {"global_step": 231887, "acc_step": 0, "speed/wps": 5516.157768733615, "speed/FLOPS": 243785939123068.2, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.87 hours", "speed/est_time_elapsed_hrs": 191.27, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.87, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04224632680416107, "optim/lr": 2.5234959322196326e-05, "optim/total_tokens": 1945209143296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2970582246780396, "created_at": "2025-06-03T05:08:22.167630+00:00"} {"global_step": 231888, "acc_step": 0, "speed/wps": 5504.49237541566, "speed/FLOPS": 243270388447310.3, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05346788093447685, "optim/lr": 2.523141209710178e-05, "optim/total_tokens": 1945217531904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2815403938293457, "created_at": "2025-06-03T05:08:25.147972+00:00"} {"global_step": 231889, "acc_step": 0, "speed/wps": 5505.488009826113, "speed/FLOPS": 243314390392133.47, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.88 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.88, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05111774429678917, "optim/lr": 2.5227864872007234e-05, "optim/total_tokens": 1945225920512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2795902490615845, "created_at": "2025-06-03T05:08:28.128153+00:00"} {"global_step": 231890, "acc_step": 0, "speed/wps": 5524.025197108476, "speed/FLOPS": 244133639188088.16, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04460030421614647, "optim/lr": 2.5224317646912687e-05, "optim/total_tokens": 1945234309120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.300015926361084, "created_at": "2025-06-03T05:08:31.098040+00:00"} {"global_step": 231891, "acc_step": 0, "speed/wps": 5527.520374424426, "speed/FLOPS": 244288108135513.88, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04423454776406288, "optim/lr": 2.522077042181836e-05, "optim/total_tokens": 1945242697728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2831077575683594, "created_at": "2025-06-03T05:08:34.069757+00:00"} {"global_step": 231892, "acc_step": 0, "speed/wps": 5523.790735875951, "speed/FLOPS": 244123277201691.94, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044582001864910126, "optim/lr": 2.5217223196723815e-05, "optim/total_tokens": 1945251086336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3063663244247437, "created_at": "2025-06-03T05:08:37.039639+00:00"} {"global_step": 231893, "acc_step": 0, "speed/wps": 5515.414945844671, "speed/FLOPS": 243753110153489.1, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04436635971069336, "optim/lr": 2.5213675971629268e-05, "optim/total_tokens": 1945259474944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2897624969482422, "created_at": "2025-06-03T05:08:40.015862+00:00"} {"global_step": 231894, "acc_step": 0, "speed/wps": 5513.217020788568, "speed/FLOPS": 243655973116009.62, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04381108283996582, "optim/lr": 2.5210128746534722e-05, "optim/total_tokens": 1945267863552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.292401909828186, "created_at": "2025-06-03T05:08:42.992755+00:00"} {"global_step": 231895, "acc_step": 0, "speed/wps": 5514.681219759007, "speed/FLOPS": 243720683216053.3, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04518520459532738, "optim/lr": 2.5206581521440396e-05, "optim/total_tokens": 1945276252160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2946877479553223, "created_at": "2025-06-03T05:08:45.967875+00:00"} {"global_step": 231896, "acc_step": 0, "speed/wps": 5522.197097302719, "speed/FLOPS": 244052846533736.75, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042109329253435135, "optim/lr": 2.520303429634585e-05, "optim/total_tokens": 1945284640768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3087421655654907, "created_at": "2025-06-03T05:08:48.938442+00:00"} {"global_step": 231897, "acc_step": 0, "speed/wps": 5515.463964665286, "speed/FLOPS": 243755276534459.2, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04464561119675636, "optim/lr": 2.5199487071251303e-05, "optim/total_tokens": 1945293029376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2810559272766113, "created_at": "2025-06-03T05:08:51.914859+00:00"} {"global_step": 231898, "acc_step": 0, "speed/wps": 5520.466766142494, "speed/FLOPS": 243976374753092.53, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04206438362598419, "optim/lr": 2.5195939846156757e-05, "optim/total_tokens": 1945301417984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3042197227478027, "created_at": "2025-06-03T05:08:54.886428+00:00"} {"global_step": 231899, "acc_step": 0, "speed/wps": 5525.491828116239, "speed/FLOPS": 244198456771733.25, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04432493820786476, "optim/lr": 2.5192392621062434e-05, "optim/total_tokens": 1945309806592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.313264012336731, "created_at": "2025-06-03T05:08:57.855151+00:00"} {"global_step": 231900, "acc_step": 0, "speed/wps": 5527.634393184654, "speed/FLOPS": 244293147181115.03, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04161262884736061, "optim/lr": 2.5188845395967884e-05, "optim/total_tokens": 1945318195200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2813044786453247, "created_at": "2025-06-03T05:09:00.823463+00:00"} {"global_step": 231901, "acc_step": 0, "speed/wps": 5514.613913431438, "speed/FLOPS": 243717708620879.75, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04338737949728966, "optim/lr": 2.5185298170873338e-05, "optim/total_tokens": 1945326583808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3002800941467285, "created_at": "2025-06-03T05:09:03.800422+00:00"} {"global_step": 231902, "acc_step": 0, "speed/wps": 5518.575813356605, "speed/FLOPS": 243892804318730.0, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.053819671273231506, "optim/lr": 2.518175094577879e-05, "optim/total_tokens": 1945334972416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.290464162826538, "created_at": "2025-06-03T05:09:06.778691+00:00"} {"global_step": 231903, "acc_step": 0, "speed/wps": 5506.658142702093, "speed/FLOPS": 243366104275968.78, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04217131808400154, "optim/lr": 2.517820372068447e-05, "optim/total_tokens": 1945343361024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2980048656463623, "created_at": "2025-06-03T05:09:09.758857+00:00"} {"global_step": 231904, "acc_step": 0, "speed/wps": 5515.742451954041, "speed/FLOPS": 243767584247195.0, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04164664447307587, "optim/lr": 2.5174656495589922e-05, "optim/total_tokens": 1945351749632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.284743309020996, "created_at": "2025-06-03T05:09:12.735502+00:00"} {"global_step": 231905, "acc_step": 0, "speed/wps": 5517.70841342052, "speed/FLOPS": 243854469681310.38, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04359949380159378, "optim/lr": 2.5171109270495372e-05, "optim/total_tokens": 1945360138240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2862581014633179, "created_at": "2025-06-03T05:09:15.715030+00:00"} {"global_step": 231906, "acc_step": 0, "speed/wps": 5512.758576203917, "speed/FLOPS": 243635712211900.16, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042707979679107666, "optim/lr": 2.5167562045400826e-05, "optim/total_tokens": 1945368526848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.280941128730774, "created_at": "2025-06-03T05:09:18.691509+00:00"} {"global_step": 231907, "acc_step": 0, "speed/wps": 5521.60661519229, "speed/FLOPS": 244026750246817.2, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04220651090145111, "optim/lr": 2.5164014820306503e-05, "optim/total_tokens": 1945376915456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2986183166503906, "created_at": "2025-06-03T05:09:21.663026+00:00"} {"global_step": 231908, "acc_step": 0, "speed/wps": 5520.680334020564, "speed/FLOPS": 243985813360163.75, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04323160648345947, "optim/lr": 2.5160467595211957e-05, "optim/total_tokens": 1945385304064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.294068455696106, "created_at": "2025-06-03T05:09:24.634942+00:00"} {"global_step": 231909, "acc_step": 0, "speed/wps": 5509.353727190143, "speed/FLOPS": 243485235313088.44, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043485209345817566, "optim/lr": 2.515692037011741e-05, "optim/total_tokens": 1945393692672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2793126106262207, "created_at": "2025-06-03T05:09:27.612260+00:00"} {"global_step": 231910, "acc_step": 0, "speed/wps": 5508.07320123253, "speed/FLOPS": 243428642620087.94, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0469190813601017, "optim/lr": 2.5153373145023084e-05, "optim/total_tokens": 1945402081280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2941789627075195, "created_at": "2025-06-03T05:09:30.590831+00:00"} {"global_step": 231911, "acc_step": 0, "speed/wps": 5495.109096259501, "speed/FLOPS": 242855695536584.66, "speed/curr_iter_time": 2.9808, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9808, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.87 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.87, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.050884608179330826, "optim/lr": 2.5149825919928538e-05, "optim/total_tokens": 1945410469888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2912697792053223, "created_at": "2025-06-03T05:09:33.576307+00:00"} {"global_step": 231912, "acc_step": 0, "speed/wps": 5503.100706707159, "speed/FLOPS": 243208883813600.75, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.86 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.86, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042110055685043335, "optim/lr": 2.514627869483399e-05, "optim/total_tokens": 1945418858496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2988200187683105, "created_at": "2025-06-03T05:09:36.559100+00:00"} {"global_step": 231913, "acc_step": 0, "speed/wps": 5511.792342604776, "speed/FLOPS": 243593009632450.03, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.054861199110746384, "optim/lr": 2.5142731469739445e-05, "optim/total_tokens": 1945427247104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.285034418106079, "created_at": "2025-06-03T05:09:39.535315+00:00"} {"global_step": 231914, "acc_step": 0, "speed/wps": 5515.0814436963465, "speed/FLOPS": 243738371065551.88, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04337102547287941, "optim/lr": 2.513918424464512e-05, "optim/total_tokens": 1945435635712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2980589866638184, "created_at": "2025-06-03T05:09:42.513814+00:00"} {"global_step": 231915, "acc_step": 0, "speed/wps": 5516.741638187054, "speed/FLOPS": 243811743164395.44, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.054293155670166016, "optim/lr": 2.5135637019550572e-05, "optim/total_tokens": 1945444024320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.306728720664978, "created_at": "2025-06-03T05:09:45.493310+00:00"} {"global_step": 231916, "acc_step": 0, "speed/wps": 5520.459303688027, "speed/FLOPS": 243976044950801.4, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04357267543673515, "optim/lr": 2.5132089794456026e-05, "optim/total_tokens": 1945452412928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.291662573814392, "created_at": "2025-06-03T05:09:48.465792+00:00"} {"global_step": 231917, "acc_step": 0, "speed/wps": 5519.668611793066, "speed/FLOPS": 243941100416172.12, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05246605724096298, "optim/lr": 2.512854256936148e-05, "optim/total_tokens": 1945460801536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2915103435516357, "created_at": "2025-06-03T05:09:51.437801+00:00"} {"global_step": 231918, "acc_step": 0, "speed/wps": 5520.299208128545, "speed/FLOPS": 243968969546515.66, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04670095816254616, "optim/lr": 2.5124995344267153e-05, "optim/total_tokens": 1945469190144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.279181718826294, "created_at": "2025-06-03T05:09:54.411085+00:00"} {"global_step": 231919, "acc_step": 0, "speed/wps": 5521.283117887226, "speed/FLOPS": 244012453321742.66, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045188501477241516, "optim/lr": 2.5121448119172607e-05, "optim/total_tokens": 1945477578752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.303796410560608, "created_at": "2025-06-03T05:09:57.382001+00:00"} {"global_step": 231920, "acc_step": 0, "speed/wps": 5516.811448363035, "speed/FLOPS": 243814828416852.9, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042762964963912964, "optim/lr": 2.511790089407806e-05, "optim/total_tokens": 1945485967360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2891318798065186, "created_at": "2025-06-03T05:10:00.355350+00:00"} {"global_step": 231921, "acc_step": 0, "speed/wps": 5521.197288275807, "speed/FLOPS": 244008660092233.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04533166065812111, "optim/lr": 2.5114353668983514e-05, "optim/total_tokens": 1945494355968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2892450094223022, "created_at": "2025-06-03T05:10:03.328244+00:00"} {"global_step": 231922, "acc_step": 0, "speed/wps": 5520.613472800298, "speed/FLOPS": 243982858436454.72, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04353226721286774, "optim/lr": 2.5110806443889188e-05, "optim/total_tokens": 1945502744576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3032057285308838, "created_at": "2025-06-03T05:10:06.299918+00:00"} {"global_step": 231923, "acc_step": 0, "speed/wps": 5521.446692662145, "speed/FLOPS": 244019682489542.5, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.047416284680366516, "optim/lr": 2.510725921879464e-05, "optim/total_tokens": 1945511133184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2860584259033203, "created_at": "2025-06-03T05:10:09.271004+00:00"} {"global_step": 231924, "acc_step": 0, "speed/wps": 5515.951098935149, "speed/FLOPS": 243776805375807.94, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04790931195020676, "optim/lr": 2.5103711993700095e-05, "optim/total_tokens": 1945519521792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3094213008880615, "created_at": "2025-06-03T05:10:12.245021+00:00"} {"global_step": 231925, "acc_step": 0, "speed/wps": 5512.393509598446, "speed/FLOPS": 243619578136518.6, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04299827665090561, "optim/lr": 2.510016476860555e-05, "optim/total_tokens": 1945527910400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2801457643508911, "created_at": "2025-06-03T05:10:15.224717+00:00"} {"global_step": 231926, "acc_step": 0, "speed/wps": 5515.479427181812, "speed/FLOPS": 243755959898545.3, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045713312923908234, "optim/lr": 2.5096617543511223e-05, "optim/total_tokens": 1945536299008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.299436092376709, "created_at": "2025-06-03T05:10:18.201886+00:00"} {"global_step": 231927, "acc_step": 0, "speed/wps": 5504.22670992733, "speed/FLOPS": 243258647392525.4, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.85 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.85, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04341447353363037, "optim/lr": 2.5093070318416676e-05, "optim/total_tokens": 1945544687616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2886357307434082, "created_at": "2025-06-03T05:10:21.182308+00:00"} {"global_step": 231928, "acc_step": 0, "speed/wps": 5512.524786656885, "speed/FLOPS": 243625379910564.72, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04210976883769035, "optim/lr": 2.508952309332213e-05, "optim/total_tokens": 1945553076224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2952651977539062, "created_at": "2025-06-03T05:10:24.160108+00:00"} {"global_step": 231929, "acc_step": 0, "speed/wps": 5518.838344929529, "speed/FLOPS": 243904406870494.84, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046775758266448975, "optim/lr": 2.5085975868227584e-05, "optim/total_tokens": 1945561464832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2890143394470215, "created_at": "2025-06-03T05:10:27.136102+00:00"} {"global_step": 231930, "acc_step": 0, "speed/wps": 5511.5518398243175, "speed/FLOPS": 243582380640558.56, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04158533737063408, "optim/lr": 2.508242864313326e-05, "optim/total_tokens": 1945569853440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2856734991073608, "created_at": "2025-06-03T05:10:30.115624+00:00"} {"global_step": 231931, "acc_step": 0, "speed/wps": 5519.519296260273, "speed/FLOPS": 243934501433888.88, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.047781191766262054, "optim/lr": 2.507888141803871e-05, "optim/total_tokens": 1945578242048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3078590631484985, "created_at": "2025-06-03T05:10:33.087845+00:00"} {"global_step": 231932, "acc_step": 0, "speed/wps": 5519.241440866981, "speed/FLOPS": 243922221647698.2, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04182916879653931, "optim/lr": 2.5075334192944165e-05, "optim/total_tokens": 1945586630656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3062736988067627, "created_at": "2025-06-03T05:10:36.060753+00:00"} {"global_step": 231933, "acc_step": 0, "speed/wps": 5523.026764748107, "speed/FLOPS": 244089513588199.94, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04631593078374863, "optim/lr": 2.5071786967849618e-05, "optim/total_tokens": 1945595019264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2860984802246094, "created_at": "2025-06-03T05:10:39.035078+00:00"} {"global_step": 231934, "acc_step": 0, "speed/wps": 5526.4166210472085, "speed/FLOPS": 244239327885762.78, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.041673507541418076, "optim/lr": 2.5068239742755295e-05, "optim/total_tokens": 1945603407872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2864571809768677, "created_at": "2025-06-03T05:10:42.004223+00:00"} {"global_step": 231935, "acc_step": 0, "speed/wps": 5513.559930647017, "speed/FLOPS": 243671127976581.28, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05259265750646591, "optim/lr": 2.506469251766075e-05, "optim/total_tokens": 1945611796480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.302923560142517, "created_at": "2025-06-03T05:10:44.979461+00:00"} {"global_step": 231936, "acc_step": 0, "speed/wps": 5522.432437836435, "speed/FLOPS": 244063247380744.94, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044086094945669174, "optim/lr": 2.50611452925662e-05, "optim/total_tokens": 1945620185088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2688724994659424, "created_at": "2025-06-03T05:10:47.954461+00:00"} {"global_step": 231937, "acc_step": 0, "speed/wps": 5519.530423145505, "speed/FLOPS": 243934993185263.53, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04569259285926819, "optim/lr": 2.5057598067471876e-05, "optim/total_tokens": 1945628573696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2955989837646484, "created_at": "2025-06-03T05:10:50.926593+00:00"} {"global_step": 231938, "acc_step": 0, "speed/wps": 5521.030595575093, "speed/FLOPS": 244001293128072.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.14, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04299016296863556, "optim/lr": 2.505405084237733e-05, "optim/total_tokens": 1945636962304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.289845585823059, "created_at": "2025-06-03T05:10:53.901769+00:00"} {"global_step": 231939, "acc_step": 0, "speed/wps": 5516.4045523324785, "speed/FLOPS": 243796845694985.0, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04428248479962349, "optim/lr": 2.5050503617282784e-05, "optim/total_tokens": 1945645350912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2832695245742798, "created_at": "2025-06-03T05:10:56.880849+00:00"} {"global_step": 231940, "acc_step": 0, "speed/wps": 5504.314111228821, "speed/FLOPS": 243262510082690.88, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.84 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.84, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042953889816999435, "optim/lr": 2.5046956392188237e-05, "optim/total_tokens": 1945653739520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3051495552062988, "created_at": "2025-06-03T05:10:59.861399+00:00"} {"global_step": 231941, "acc_step": 0, "speed/wps": 5532.245101290594, "speed/FLOPS": 244496916879654.12, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 190.76, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042950332164764404, "optim/lr": 2.504340916709391e-05, "optim/total_tokens": 1945662128128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3122599124908447, "created_at": "2025-06-03T05:11:02.826728+00:00"} {"global_step": 231942, "acc_step": 0, "speed/wps": 5523.548574001166, "speed/FLOPS": 244112574886323.28, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04426465183496475, "optim/lr": 2.5039861941999365e-05, "optim/total_tokens": 1945670516736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.30451238155365, "created_at": "2025-06-03T05:11:05.796811+00:00"} {"global_step": 231943, "acc_step": 0, "speed/wps": 5534.805858941847, "speed/FLOPS": 244610089260693.66, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043298352509737015, "optim/lr": 2.5036314716904818e-05, "optim/total_tokens": 1945678905344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.300272822380066, "created_at": "2025-06-03T05:11:08.765000+00:00"} {"global_step": 231944, "acc_step": 0, "speed/wps": 5513.385355208745, "speed/FLOPS": 243663412635767.75, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04592178761959076, "optim/lr": 2.5032767491810272e-05, "optim/total_tokens": 1945687293952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.290536880493164, "created_at": "2025-06-03T05:11:11.742012+00:00"} {"global_step": 231945, "acc_step": 0, "speed/wps": 5510.1256334247155, "speed/FLOPS": 243519349617682.25, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045499857515096664, "optim/lr": 2.5029220266715946e-05, "optim/total_tokens": 1945695682560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3066858053207397, "created_at": "2025-06-03T05:11:14.720148+00:00"} {"global_step": 231946, "acc_step": 0, "speed/wps": 5516.268447902461, "speed/FLOPS": 243790830575823.84, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04351801797747612, "optim/lr": 2.50256730416214e-05, "optim/total_tokens": 1945704071168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2915410995483398, "created_at": "2025-06-03T05:11:17.698393+00:00"} {"global_step": 231947, "acc_step": 0, "speed/wps": 5514.754454747446, "speed/FLOPS": 243723919827691.66, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04634340852499008, "optim/lr": 2.5022125816526853e-05, "optim/total_tokens": 1945712459776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2914741039276123, "created_at": "2025-06-03T05:11:20.673060+00:00"} {"global_step": 231948, "acc_step": 0, "speed/wps": 5502.359696121759, "speed/FLOPS": 243176134938562.1, "speed/curr_iter_time": 2.9769, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9769, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.83 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.83, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04436749219894409, "optim/lr": 2.5018578591432307e-05, "optim/total_tokens": 1945720848384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2954541444778442, "created_at": "2025-06-03T05:11:23.658887+00:00"} {"global_step": 231949, "acc_step": 0, "speed/wps": 5509.943085470186, "speed/FLOPS": 243511281932457.2, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05038665980100632, "optim/lr": 2.501503136633798e-05, "optim/total_tokens": 1945729236992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3066391944885254, "created_at": "2025-06-03T05:11:26.639774+00:00"} {"global_step": 231950, "acc_step": 0, "speed/wps": 5516.557215371387, "speed/FLOPS": 243803592619904.5, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042883019894361496, "optim/lr": 2.5011484141243434e-05, "optim/total_tokens": 1945737625600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3019967079162598, "created_at": "2025-06-03T05:11:29.616436+00:00"} {"global_step": 231951, "acc_step": 0, "speed/wps": 5517.180803173446, "speed/FLOPS": 243831152008943.78, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046214427798986435, "optim/lr": 2.5007936916148888e-05, "optim/total_tokens": 1945746014208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2908895015716553, "created_at": "2025-06-03T05:11:32.589874+00:00"} {"global_step": 231952, "acc_step": 0, "speed/wps": 5530.022504082338, "speed/FLOPS": 244398689459333.0, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04136011376976967, "optim/lr": 2.500438969105434e-05, "optim/total_tokens": 1945754402816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2938534021377563, "created_at": "2025-06-03T05:11:35.562287+00:00"} {"global_step": 231953, "acc_step": 0, "speed/wps": 5511.1436263108035, "speed/FLOPS": 243564339692687.4, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.82 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.82, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05072086304426193, "optim/lr": 2.5000842465960015e-05, "optim/total_tokens": 1945762791424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.290116548538208, "created_at": "2025-06-03T05:11:38.538928+00:00"} {"global_step": 231954, "acc_step": 0, "speed/wps": 5516.986307882644, "speed/FLOPS": 243822556312607.47, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04234229400753975, "optim/lr": 2.499729524086547e-05, "optim/total_tokens": 1945771180032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3015964031219482, "created_at": "2025-06-03T05:11:41.516976+00:00"} {"global_step": 231955, "acc_step": 0, "speed/wps": 5515.331404205796, "speed/FLOPS": 243749418040655.72, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0461294949054718, "optim/lr": 2.4993748015770922e-05, "optim/total_tokens": 1945779568640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2966209650039673, "created_at": "2025-06-03T05:11:44.491518+00:00"} {"global_step": 231956, "acc_step": 0, "speed/wps": 5520.420327838385, "speed/FLOPS": 243974322417743.7, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04227113351225853, "optim/lr": 2.4990200790676376e-05, "optim/total_tokens": 1945787957248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3001410961151123, "created_at": "2025-06-03T05:11:47.468114+00:00"} {"global_step": 231957, "acc_step": 0, "speed/wps": 5515.97165111338, "speed/FLOPS": 243777713676890.16, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04413355514407158, "optim/lr": 2.4986653565582053e-05, "optim/total_tokens": 1945796345856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2884740829467773, "created_at": "2025-06-03T05:11:50.442915+00:00"} {"global_step": 231958, "acc_step": 0, "speed/wps": 5526.533054825171, "speed/FLOPS": 244244473662786.66, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04233258590102196, "optim/lr": 2.4983106340487503e-05, "optim/total_tokens": 1945804734464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.297098159790039, "created_at": "2025-06-03T05:11:53.416653+00:00"} {"global_step": 231959, "acc_step": 0, "speed/wps": 5514.726815608185, "speed/FLOPS": 243722698319206.22, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044863149523735046, "optim/lr": 2.4979559115392957e-05, "optim/total_tokens": 1945813123072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.293912649154663, "created_at": "2025-06-03T05:11:56.392928+00:00"} {"global_step": 231960, "acc_step": 0, "speed/wps": 5528.126361894593, "speed/FLOPS": 244314889679970.22, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04261365905404091, "optim/lr": 2.497601189029841e-05, "optim/total_tokens": 1945821511680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3083550930023193, "created_at": "2025-06-03T05:11:59.360422+00:00"} {"global_step": 231961, "acc_step": 0, "speed/wps": 5518.339333083225, "speed/FLOPS": 243882353101062.38, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0462193600833416, "optim/lr": 2.4972464665204088e-05, "optim/total_tokens": 1945829900288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2878257036209106, "created_at": "2025-06-03T05:12:02.333476+00:00"} {"global_step": 231962, "acc_step": 0, "speed/wps": 5528.589343340478, "speed/FLOPS": 244335351090124.47, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042820654809474945, "optim/lr": 2.496891744010954e-05, "optim/total_tokens": 1945838288896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.292667269706726, "created_at": "2025-06-03T05:12:05.300820+00:00"} {"global_step": 231963, "acc_step": 0, "speed/wps": 5522.661310871356, "speed/FLOPS": 244073362397410.06, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043219756335020065, "optim/lr": 2.496537021501499e-05, "optim/total_tokens": 1945846677504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3055745363235474, "created_at": "2025-06-03T05:12:08.271272+00:00"} {"global_step": 231964, "acc_step": 0, "speed/wps": 5525.413198529772, "speed/FLOPS": 244194981746474.12, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.041993021965026855, "optim/lr": 2.496182298992067e-05, "optim/total_tokens": 1945855066112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2833412885665894, "created_at": "2025-06-03T05:12:11.240262+00:00"} {"global_step": 231965, "acc_step": 0, "speed/wps": 5515.054332495946, "speed/FLOPS": 243737172889261.9, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045513756573200226, "optim/lr": 2.4958275764826122e-05, "optim/total_tokens": 1945863454720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2800594568252563, "created_at": "2025-06-03T05:12:14.215078+00:00"} {"global_step": 231966, "acc_step": 0, "speed/wps": 5523.453363388557, "speed/FLOPS": 244108367064578.03, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04564770311117172, "optim/lr": 2.4954728539731576e-05, "optim/total_tokens": 1945871843328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3025676012039185, "created_at": "2025-06-03T05:12:17.185247+00:00"} {"global_step": 231967, "acc_step": 0, "speed/wps": 5510.6751079995365, "speed/FLOPS": 243543633581423.53, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04798088222742081, "optim/lr": 2.495118131463703e-05, "optim/total_tokens": 1945880231936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2987383604049683, "created_at": "2025-06-03T05:12:20.163171+00:00"} {"global_step": 231968, "acc_step": 0, "speed/wps": 5527.114822814321, "speed/FLOPS": 244270184830148.56, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05495923385024071, "optim/lr": 2.4947634089542703e-05, "optim/total_tokens": 1945888620544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.302176833152771, "created_at": "2025-06-03T05:12:23.134151+00:00"} {"global_step": 231969, "acc_step": 0, "speed/wps": 5522.9984821366925, "speed/FLOPS": 244088263641538.94, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043442174792289734, "optim/lr": 2.4944086864448157e-05, "optim/total_tokens": 1945897009152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.302081823348999, "created_at": "2025-06-03T05:12:26.104890+00:00"} {"global_step": 231970, "acc_step": 0, "speed/wps": 5523.307822386403, "speed/FLOPS": 244101934897229.22, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05553756654262543, "optim/lr": 2.494053963935361e-05, "optim/total_tokens": 1945905397760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2927218675613403, "created_at": "2025-06-03T05:12:29.075759+00:00"} {"global_step": 231971, "acc_step": 0, "speed/wps": 5525.385748770908, "speed/FLOPS": 244193768607632.94, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04278663173317909, "optim/lr": 2.4936992414259064e-05, "optim/total_tokens": 1945913786368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2991547584533691, "created_at": "2025-06-03T05:12:32.045207+00:00"} {"global_step": 231972, "acc_step": 0, "speed/wps": 5515.151666588468, "speed/FLOPS": 243741474557950.3, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05248691886663437, "optim/lr": 2.4933445189164738e-05, "optim/total_tokens": 1945922174976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.291791319847107, "created_at": "2025-06-03T05:12:35.021060+00:00"} {"global_step": 231973, "acc_step": 0, "speed/wps": 5505.357928273022, "speed/FLOPS": 243308641453304.56, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.81 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.81, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04209446907043457, "optim/lr": 2.4929897964070192e-05, "optim/total_tokens": 1945930563584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2811341285705566, "created_at": "2025-06-03T05:12:38.004334+00:00"} {"global_step": 231974, "acc_step": 0, "speed/wps": 5508.718283097004, "speed/FLOPS": 243457151936669.4, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05723606050014496, "optim/lr": 2.4926350738975645e-05, "optim/total_tokens": 1945938952192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2887132167816162, "created_at": "2025-06-03T05:12:40.983690+00:00"} {"global_step": 231975, "acc_step": 0, "speed/wps": 5517.700378238219, "speed/FLOPS": 243854114567380.47, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04226414114236832, "optim/lr": 2.49228035138811e-05, "optim/total_tokens": 1945947340800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2957004308700562, "created_at": "2025-06-03T05:12:43.961890+00:00"} {"global_step": 231976, "acc_step": 0, "speed/wps": 5519.906297160173, "speed/FLOPS": 243951604892814.28, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.056636977940797806, "optim/lr": 2.4919256288786773e-05, "optim/total_tokens": 1945955729408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3034021854400635, "created_at": "2025-06-03T05:12:46.934825+00:00"} {"global_step": 231977, "acc_step": 0, "speed/wps": 5522.599196561918, "speed/FLOPS": 244070617262862.75, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04490534961223602, "optim/lr": 2.4915709063692226e-05, "optim/total_tokens": 1945964118016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3029241561889648, "created_at": "2025-06-03T05:12:49.905266+00:00"} {"global_step": 231978, "acc_step": 0, "speed/wps": 5527.322740747736, "speed/FLOPS": 244279373738585.03, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 190.96, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04761893302202225, "optim/lr": 2.491216183859768e-05, "optim/total_tokens": 1945972506624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.307464838027954, "created_at": "2025-06-03T05:12:52.877571+00:00"} {"global_step": 231979, "acc_step": 0, "speed/wps": 5530.572678172661, "speed/FLOPS": 244423004338079.0, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.77 hours", "speed/est_time_elapsed_hrs": 190.8, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.77, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04342903196811676, "optim/lr": 2.4908614613503134e-05, "optim/total_tokens": 1945980895232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2836217880249023, "created_at": "2025-06-03T05:12:55.846419+00:00"} {"global_step": 231980, "acc_step": 0, "speed/wps": 5515.709466130562, "speed/FLOPS": 243766126442634.0, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04751807823777199, "optim/lr": 2.4905067388408807e-05, "optim/total_tokens": 1945989283840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2913613319396973, "created_at": "2025-06-03T05:12:58.820541+00:00"} {"global_step": 231981, "acc_step": 0, "speed/wps": 5510.829923108921, "speed/FLOPS": 243550475616842.78, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.8 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.8, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04236435145139694, "optim/lr": 2.490152016331426e-05, "optim/total_tokens": 1945997672448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3046801090240479, "created_at": "2025-06-03T05:13:01.801958+00:00"} {"global_step": 231982, "acc_step": 0, "speed/wps": 5509.4025766470995, "speed/FLOPS": 243487394209051.72, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.053725190460681915, "optim/lr": 2.4897972938219715e-05, "optim/total_tokens": 1946006061056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2995957136154175, "created_at": "2025-06-03T05:13:04.780406+00:00"} {"global_step": 231983, "acc_step": 0, "speed/wps": 5517.185228350119, "speed/FLOPS": 243831347579102.62, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04393506795167923, "optim/lr": 2.4894425713125168e-05, "optim/total_tokens": 1946014449664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.289334774017334, "created_at": "2025-06-03T05:13:07.754500+00:00"} {"global_step": 231984, "acc_step": 0, "speed/wps": 5521.7987655756115, "speed/FLOPS": 244035242310245.2, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0529879666864872, "optim/lr": 2.4890878488030842e-05, "optim/total_tokens": 1946022838272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3174577951431274, "created_at": "2025-06-03T05:13:10.726024+00:00"} {"global_step": 231985, "acc_step": 0, "speed/wps": 5523.779556251785, "speed/FLOPS": 244122783119526.28, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042248744517564774, "optim/lr": 2.4887331262936296e-05, "optim/total_tokens": 1946031226880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.286198377609253, "created_at": "2025-06-03T05:13:13.700789+00:00"} {"global_step": 231986, "acc_step": 0, "speed/wps": 5514.861271612867, "speed/FLOPS": 243728640586405.0, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.050498414784669876, "optim/lr": 2.488378403784175e-05, "optim/total_tokens": 1946039615488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2802026271820068, "created_at": "2025-06-03T05:13:16.680529+00:00"} {"global_step": 231987, "acc_step": 0, "speed/wps": 5511.97698104383, "speed/FLOPS": 243601169706391.0, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04310781881213188, "optim/lr": 2.4880236812747203e-05, "optim/total_tokens": 1946048004096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2815420627593994, "created_at": "2025-06-03T05:13:19.659833+00:00"} {"global_step": 231988, "acc_step": 0, "speed/wps": 5507.846156073029, "speed/FLOPS": 243418608386160.5, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04872949793934822, "optim/lr": 2.487668958765288e-05, "optim/total_tokens": 1946056392704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3055561780929565, "created_at": "2025-06-03T05:13:22.638768+00:00"} {"global_step": 231989, "acc_step": 0, "speed/wps": 5508.8355024157045, "speed/FLOPS": 243462332430573.1, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04355236142873764, "optim/lr": 2.487314236255833e-05, "optim/total_tokens": 1946064781312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2894465923309326, "created_at": "2025-06-03T05:13:25.619495+00:00"} {"global_step": 231990, "acc_step": 0, "speed/wps": 5511.713038260169, "speed/FLOPS": 243589504786334.8, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04620252922177315, "optim/lr": 2.4869595137463784e-05, "optim/total_tokens": 1946073169920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2847634553909302, "created_at": "2025-06-03T05:13:28.595899+00:00"} {"global_step": 231991, "acc_step": 0, "speed/wps": 5510.2146641598, "speed/FLOPS": 243523284320472.4, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044124942272901535, "optim/lr": 2.486604791236946e-05, "optim/total_tokens": 1946081558528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2869343757629395, "created_at": "2025-06-03T05:13:31.572733+00:00"} {"global_step": 231992, "acc_step": 0, "speed/wps": 5506.830123418004, "speed/FLOPS": 243373704943334.97, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.79 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.79, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0463983528316021, "optim/lr": 2.4862500687274915e-05, "optim/total_tokens": 1946089947136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3089189529418945, "created_at": "2025-06-03T05:13:34.557194+00:00"} {"global_step": 231993, "acc_step": 0, "speed/wps": 5512.748255704419, "speed/FLOPS": 243635256098647.4, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04374022036790848, "optim/lr": 2.485895346218037e-05, "optim/total_tokens": 1946098335744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2972562313079834, "created_at": "2025-06-03T05:13:37.533145+00:00"} {"global_step": 231994, "acc_step": 0, "speed/wps": 5522.97681640879, "speed/FLOPS": 244087306127260.9, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.77 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.77, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043336860835552216, "optim/lr": 2.4855406237085822e-05, "optim/total_tokens": 1946106724352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3073543310165405, "created_at": "2025-06-03T05:13:40.508209+00:00"} {"global_step": 231995, "acc_step": 0, "speed/wps": 5515.426397699583, "speed/FLOPS": 243753616266860.28, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04446008801460266, "optim/lr": 2.4851859011991496e-05, "optim/total_tokens": 1946115112960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2909002304077148, "created_at": "2025-06-03T05:13:43.488174+00:00"} {"global_step": 231996, "acc_step": 0, "speed/wps": 5508.938122793027, "speed/FLOPS": 243466867725992.06, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0455736368894577, "optim/lr": 2.484831178689695e-05, "optim/total_tokens": 1946123501568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2951432466506958, "created_at": "2025-06-03T05:13:46.469424+00:00"} {"global_step": 231997, "acc_step": 0, "speed/wps": 5524.2248861351045, "speed/FLOPS": 244142464420964.03, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.77 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.77, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04274633899331093, "optim/lr": 2.4844764561802403e-05, "optim/total_tokens": 1946131890176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.273829460144043, "created_at": "2025-06-03T05:13:49.442554+00:00"} {"global_step": 231998, "acc_step": 0, "speed/wps": 5512.61345013093, "speed/FLOPS": 243629298382296.7, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044122613966464996, "optim/lr": 2.4841217336707857e-05, "optim/total_tokens": 1946140278784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2962387800216675, "created_at": "2025-06-03T05:13:52.418675+00:00"} {"global_step": 231999, "acc_step": 0, "speed/wps": 5513.480085555481, "speed/FLOPS": 243667599232219.66, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.78 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.78, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04222194105386734, "optim/lr": 2.483767011161353e-05, "optim/total_tokens": 1946148667392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.305695652961731, "created_at": "2025-06-03T05:13:55.396835+00:00"} {"global_step": 232000, "acc_step": 0, "speed/wps": 5524.675906548002, "speed/FLOPS": 244162397214682.34, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.77 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.77, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04386298730969429, "optim/lr": 2.4834122886518984e-05, "optim/total_tokens": 1946157056000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2977104187011719, "created_at": "2025-06-03T05:13:58.369774+00:00"} {"global_step": 232001, "acc_step": 0, "speed/wps": 216.94964664873072, "speed/FLOPS": 9588063932917.713, "speed/curr_iter_time": 6.0092, "speed/data_load_time": 3.4645, "speed/curr_step_time": 6.0092, "speed/est_time_elapsed": "16.14 days", "speed/est_time_remaining": "11.68 hours", "speed/est_time_elapsed_hrs": 387.26, "speed/est_time_elapsed_days": 16.14, "speed/est_time_remaining_hrs": 11.68, "speed/est_time_remaining_days": 0.49, "optim/grad_norm": 0.04240504279732704, "optim/lr": 2.4830575661424438e-05, "optim/total_tokens": 1946165444608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2972749471664429, "created_at": "2025-06-03T05:15:13.912302+00:00"} {"global_step": 232002, "acc_step": 0, "speed/wps": 5621.875743597731, "speed/FLOPS": 248458132498413.66, "speed/curr_iter_time": 2.9111, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9111, "speed/est_time_elapsed": "7.82 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 187.61, "speed/est_time_elapsed_days": 7.82, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042862776666879654, "optim/lr": 2.482702843632989e-05, "optim/total_tokens": 1946173833216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3053165674209595, "created_at": "2025-06-03T05:15:16.834707+00:00"} {"global_step": 232003, "acc_step": 0, "speed/wps": 5568.995436350047, "speed/FLOPS": 246121093584014.97, "speed/curr_iter_time": 2.9405, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9405, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 189.5, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04228128120303154, "optim/lr": 2.4823481211235565e-05, "optim/total_tokens": 1946182221824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3123674392700195, "created_at": "2025-06-03T05:15:19.781052+00:00"} {"global_step": 232004, "acc_step": 0, "speed/wps": 5546.81447412684, "speed/FLOPS": 245140808586205.8, "speed/curr_iter_time": 2.9527, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9527, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 190.29, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043597567826509476, "optim/lr": 2.481993398614102e-05, "optim/total_tokens": 1946190610432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2839329242706299, "created_at": "2025-06-03T05:15:22.743429+00:00"} {"global_step": 232005, "acc_step": 0, "speed/wps": 5542.693521141737, "speed/FLOPS": 244958683557213.75, "speed/curr_iter_time": 2.9541, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9541, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 190.38, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04314254969358444, "optim/lr": 2.4816386761046472e-05, "optim/total_tokens": 1946198999040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.290210485458374, "created_at": "2025-06-03T05:15:25.707971+00:00"} {"global_step": 232006, "acc_step": 0, "speed/wps": 5538.92496124578, "speed/FLOPS": 244792132499050.62, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 190.55, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0426553338766098, "optim/lr": 2.4812839535951926e-05, "optim/total_tokens": 1946207387648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2810488939285278, "created_at": "2025-06-03T05:15:28.670534+00:00"} {"global_step": 232007, "acc_step": 0, "speed/wps": 5520.482037580778, "speed/FLOPS": 243977049672498.38, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.76 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.76, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04225873202085495, "optim/lr": 2.48092923108576e-05, "optim/total_tokens": 1946215776256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3044829368591309, "created_at": "2025-06-03T05:15:31.645491+00:00"} {"global_step": 232008, "acc_step": 0, "speed/wps": 5526.401305906986, "speed/FLOPS": 244238651034954.94, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.76 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.76, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04332878068089485, "optim/lr": 2.4805745085763053e-05, "optim/total_tokens": 1946224164864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2866175174713135, "created_at": "2025-06-03T05:15:34.618465+00:00"} {"global_step": 232009, "acc_step": 0, "speed/wps": 5536.6722406506615, "speed/FLOPS": 244692573779215.66, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 190.59, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042075034230947495, "optim/lr": 2.4802197860668507e-05, "optim/total_tokens": 1946232553472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2824803590774536, "created_at": "2025-06-03T05:15:37.583966+00:00"} {"global_step": 232010, "acc_step": 0, "speed/wps": 5556.419264146707, "speed/FLOPS": 245565291143312.0, "speed/curr_iter_time": 2.9478, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9478, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 189.98, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04427470266819, "optim/lr": 2.479865063557396e-05, "optim/total_tokens": 1946240942080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3066612482070923, "created_at": "2025-06-03T05:15:40.537895+00:00"} {"global_step": 232011, "acc_step": 0, "speed/wps": 5516.633737756908, "speed/FLOPS": 243806974517667.44, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.76 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.76, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0452263206243515, "optim/lr": 2.4795103410479634e-05, "optim/total_tokens": 1946249330688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2916371822357178, "created_at": "2025-06-03T05:15:43.514809+00:00"} {"global_step": 232012, "acc_step": 0, "speed/wps": 5533.493569957347, "speed/FLOPS": 244552092804482.7, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 190.71, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04451558738946915, "optim/lr": 2.4791556185385088e-05, "optim/total_tokens": 1946257719296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3035751581192017, "created_at": "2025-06-03T05:15:46.480382+00:00"} {"global_step": 232013, "acc_step": 0, "speed/wps": 5531.6134801047365, "speed/FLOPS": 244469002456169.53, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.048723254352808, "optim/lr": 2.478800896029054e-05, "optim/total_tokens": 1946266107904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.303253412246704, "created_at": "2025-06-03T05:15:49.451455+00:00"} {"global_step": 232014, "acc_step": 0, "speed/wps": 5530.881657222653, "speed/FLOPS": 244436659630590.53, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04258500784635544, "optim/lr": 2.4784461735195995e-05, "optim/total_tokens": 1946274496512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2949055433273315, "created_at": "2025-06-03T05:15:52.422337+00:00"} {"global_step": 232015, "acc_step": 0, "speed/wps": 5513.132788107743, "speed/FLOPS": 243652250462659.1, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.76 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.76, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04292716830968857, "optim/lr": 2.4780914510101672e-05, "optim/total_tokens": 1946282885120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2972230911254883, "created_at": "2025-06-03T05:15:55.400706+00:00"} {"global_step": 232016, "acc_step": 0, "speed/wps": 5524.597216037321, "speed/FLOPS": 244158919496884.8, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044584013521671295, "optim/lr": 2.4777367285007123e-05, "optim/total_tokens": 1946291273728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3039050102233887, "created_at": "2025-06-03T05:15:58.370895+00:00"} {"global_step": 232017, "acc_step": 0, "speed/wps": 5517.939096558959, "speed/FLOPS": 243864664695286.06, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.76 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.76, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042936477810144424, "optim/lr": 2.4773820059912576e-05, "optim/total_tokens": 1946299662336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3127696514129639, "created_at": "2025-06-03T05:16:01.344459+00:00"} {"global_step": 232018, "acc_step": 0, "speed/wps": 5533.644898382767, "speed/FLOPS": 244558780746317.12, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046127427369356155, "optim/lr": 2.4770272834818253e-05, "optim/total_tokens": 1946308050944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.289664387702942, "created_at": "2025-06-03T05:16:04.313389+00:00"} {"global_step": 232019, "acc_step": 0, "speed/wps": 5526.354633164166, "speed/FLOPS": 244236588338615.06, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04821188747882843, "optim/lr": 2.4766725609723707e-05, "optim/total_tokens": 1946316439552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.303434133529663, "created_at": "2025-06-03T05:16:07.286744+00:00"} {"global_step": 232020, "acc_step": 0, "speed/wps": 5526.766846482472, "speed/FLOPS": 244254806057385.16, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04349786043167114, "optim/lr": 2.476317838462916e-05, "optim/total_tokens": 1946324828160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2795698642730713, "created_at": "2025-06-03T05:16:10.257488+00:00"} {"global_step": 232021, "acc_step": 0, "speed/wps": 5524.501863443298, "speed/FLOPS": 244154705400287.8, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04874138534069061, "optim/lr": 2.475963115953461e-05, "optim/total_tokens": 1946333216768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2933725118637085, "created_at": "2025-06-03T05:16:13.227342+00:00"} {"global_step": 232022, "acc_step": 0, "speed/wps": 5527.326600433174, "speed/FLOPS": 244279544316925.72, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042148273438215256, "optim/lr": 2.4756083934440288e-05, "optim/total_tokens": 1946341605376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2937400341033936, "created_at": "2025-06-03T05:16:16.199007+00:00"} {"global_step": 232023, "acc_step": 0, "speed/wps": 5522.124524695503, "speed/FLOPS": 244049639195958.06, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046921487897634506, "optim/lr": 2.4752536709345742e-05, "optim/total_tokens": 1946349993984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.291944146156311, "created_at": "2025-06-03T05:16:19.170499+00:00"} {"global_step": 232024, "acc_step": 0, "speed/wps": 5521.624349117557, "speed/FLOPS": 244027533995543.56, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04353705793619156, "optim/lr": 2.4748989484251195e-05, "optim/total_tokens": 1946358382592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3000668287277222, "created_at": "2025-06-03T05:16:22.146303+00:00"} {"global_step": 232025, "acc_step": 0, "speed/wps": 5520.199809393896, "speed/FLOPS": 243964576631213.03, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05280917510390282, "optim/lr": 2.474544225915665e-05, "optim/total_tokens": 1946366771200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2937555313110352, "created_at": "2025-06-03T05:16:25.122449+00:00"} {"global_step": 232026, "acc_step": 0, "speed/wps": 5548.566206415935, "speed/FLOPS": 245218226187205.2, "speed/curr_iter_time": 2.9521, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9521, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 190.27, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.041951145976781845, "optim/lr": 2.4741895034062323e-05, "optim/total_tokens": 1946375159808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3005956411361694, "created_at": "2025-06-03T05:16:28.082815+00:00"} {"global_step": 232027, "acc_step": 0, "speed/wps": 5536.532247068382, "speed/FLOPS": 244686386779431.03, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 190.68, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05605978146195412, "optim/lr": 2.4738347808967776e-05, "optim/total_tokens": 1946383548416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2736012935638428, "created_at": "2025-06-03T05:16:31.046548+00:00"} {"global_step": 232028, "acc_step": 0, "speed/wps": 5533.417629502573, "speed/FLOPS": 244548736625080.12, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0438259094953537, "optim/lr": 2.473480058387323e-05, "optim/total_tokens": 1946391937024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2790653705596924, "created_at": "2025-06-03T05:16:34.017318+00:00"} {"global_step": 232029, "acc_step": 0, "speed/wps": 5512.976638125926, "speed/FLOPS": 243645349432710.84, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0523708239197731, "optim/lr": 2.4731253358778684e-05, "optim/total_tokens": 1946400325632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2863951921463013, "created_at": "2025-06-03T05:16:36.996769+00:00"} {"global_step": 232030, "acc_step": 0, "speed/wps": 5525.732479881031, "speed/FLOPS": 244209092347969.7, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043514057993888855, "optim/lr": 2.4727706133684357e-05, "optim/total_tokens": 1946408714240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2999099493026733, "created_at": "2025-06-03T05:16:39.965553+00:00"} {"global_step": 232031, "acc_step": 0, "speed/wps": 5521.497450359073, "speed/FLOPS": 244021925719945.28, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.049684807658195496, "optim/lr": 2.472415890858981e-05, "optim/total_tokens": 1946417102848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.3054972887039185, "created_at": "2025-06-03T05:16:42.939882+00:00"} {"global_step": 232032, "acc_step": 0, "speed/wps": 5534.960811694646, "speed/FLOPS": 244616937379247.28, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045146018266677856, "optim/lr": 2.4720611683495265e-05, "optim/total_tokens": 1946425491456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2885981798171997, "created_at": "2025-06-03T05:16:45.903631+00:00"} {"global_step": 232033, "acc_step": 0, "speed/wps": 5517.418272596125, "speed/FLOPS": 243841646941947.47, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0445050373673439, "optim/lr": 2.4717064458400718e-05, "optim/total_tokens": 1946433880064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2868363857269287, "created_at": "2025-06-03T05:16:48.882196+00:00"} {"global_step": 232034, "acc_step": 0, "speed/wps": 5512.243111532995, "speed/FLOPS": 243612931311832.72, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.75 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.75, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04451078549027443, "optim/lr": 2.4713517233306392e-05, "optim/total_tokens": 1946442268672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2749500274658203, "created_at": "2025-06-03T05:16:51.861319+00:00"} {"global_step": 232035, "acc_step": 0, "speed/wps": 5533.968827114901, "speed/FLOPS": 244573096738259.9, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0456109493970871, "optim/lr": 2.4709970008211846e-05, "optim/total_tokens": 1946450657280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.3067320585250854, "created_at": "2025-06-03T05:16:54.825886+00:00"} {"global_step": 232036, "acc_step": 0, "speed/wps": 5524.575502632523, "speed/FLOPS": 244157959875532.03, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.054030537605285645, "optim/lr": 2.47064227831173e-05, "optim/total_tokens": 1946459045888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.281754970550537, "created_at": "2025-06-03T05:16:57.799200+00:00"} {"global_step": 232037, "acc_step": 0, "speed/wps": 5522.855556319119, "speed/FLOPS": 244081947051962.84, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.09588214755058289, "optim/lr": 2.4702875558022753e-05, "optim/total_tokens": 1946467434496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2984939813613892, "created_at": "2025-06-03T05:17:00.770180+00:00"} {"global_step": 232038, "acc_step": 0, "speed/wps": 5527.375655377308, "speed/FLOPS": 244281712294370.5, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04923612251877785, "optim/lr": 2.4699328332928427e-05, "optim/total_tokens": 1946475823104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.289442777633667, "created_at": "2025-06-03T05:17:03.743257+00:00"} {"global_step": 232039, "acc_step": 0, "speed/wps": 5514.026155791219, "speed/FLOPS": 243691732741598.4, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04274527356028557, "optim/lr": 2.469578110783388e-05, "optim/total_tokens": 1946484211712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3004528284072876, "created_at": "2025-06-03T05:17:06.718425+00:00"} {"global_step": 232040, "acc_step": 0, "speed/wps": 5518.091040136115, "speed/FLOPS": 243871379823678.62, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044834911823272705, "optim/lr": 2.4692233882739334e-05, "optim/total_tokens": 1946492600320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2928410768508911, "created_at": "2025-06-03T05:17:09.694331+00:00"} {"global_step": 232041, "acc_step": 0, "speed/wps": 5520.123377712668, "speed/FLOPS": 243961198742115.56, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042300913482904434, "optim/lr": 2.4688686657644788e-05, "optim/total_tokens": 1946500988928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.300260066986084, "created_at": "2025-06-03T05:17:12.668513+00:00"} {"global_step": 232042, "acc_step": 0, "speed/wps": 5511.479785892913, "speed/FLOPS": 243579196225595.94, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04281261935830116, "optim/lr": 2.468513943255046e-05, "optim/total_tokens": 1946509377536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2872951030731201, "created_at": "2025-06-03T05:17:15.644870+00:00"} {"global_step": 232043, "acc_step": 0, "speed/wps": 5537.687103555979, "speed/FLOPS": 244737425525091.44, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 190.66, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04363692179322243, "optim/lr": 2.4681592207455915e-05, "optim/total_tokens": 1946517766144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.294702410697937, "created_at": "2025-06-03T05:17:18.611636+00:00"} {"global_step": 232044, "acc_step": 0, "speed/wps": 5531.6582823211675, "speed/FLOPS": 244470982484817.25, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04385015368461609, "optim/lr": 2.467804498236137e-05, "optim/total_tokens": 1946526154752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2873637676239014, "created_at": "2025-06-03T05:17:21.577229+00:00"} {"global_step": 232045, "acc_step": 0, "speed/wps": 5516.621593243602, "speed/FLOPS": 243806437792340.56, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04860956221818924, "optim/lr": 2.4674497757267046e-05, "optim/total_tokens": 1946534543360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2990410327911377, "created_at": "2025-06-03T05:17:24.551840+00:00"} {"global_step": 232046, "acc_step": 0, "speed/wps": 5526.125058997562, "speed/FLOPS": 244226442335518.25, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04297900199890137, "optim/lr": 2.46709505321725e-05, "optim/total_tokens": 1946542931968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2920230627059937, "created_at": "2025-06-03T05:17:27.523807+00:00"} {"global_step": 232047, "acc_step": 0, "speed/wps": 5524.720873622548, "speed/FLOPS": 244164384529214.97, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04904421418905258, "optim/lr": 2.466740330707795e-05, "optim/total_tokens": 1946551320576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2987552881240845, "created_at": "2025-06-03T05:17:30.492949+00:00"} {"global_step": 232048, "acc_step": 0, "speed/wps": 5522.4358555689, "speed/FLOPS": 244063398427026.3, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04273392632603645, "optim/lr": 2.4663856081983403e-05, "optim/total_tokens": 1946559709184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.295418381690979, "created_at": "2025-06-03T05:17:33.463595+00:00"} {"global_step": 232049, "acc_step": 0, "speed/wps": 5527.145428095546, "speed/FLOPS": 244271537426926.66, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.08255463093519211, "optim/lr": 2.466030885688908e-05, "optim/total_tokens": 1946568097792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2978955507278442, "created_at": "2025-06-03T05:17:36.435237+00:00"} {"global_step": 232050, "acc_step": 0, "speed/wps": 5523.508977447493, "speed/FLOPS": 244110824921324.44, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042851079255342484, "optim/lr": 2.4656761631794534e-05, "optim/total_tokens": 1946576486400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2983933687210083, "created_at": "2025-06-03T05:17:39.405273+00:00"} {"global_step": 232051, "acc_step": 0, "speed/wps": 5530.535448874339, "speed/FLOPS": 244421358993650.0, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04571351781487465, "optim/lr": 2.4653214406699988e-05, "optim/total_tokens": 1946584875008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2805771827697754, "created_at": "2025-06-03T05:17:42.375887+00:00"} {"global_step": 232052, "acc_step": 0, "speed/wps": 5509.925508039899, "speed/FLOPS": 243510505100007.94, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.74 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.74, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04333644360303879, "optim/lr": 2.464966718160544e-05, "optim/total_tokens": 1946593263616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2833868265151978, "created_at": "2025-06-03T05:17:45.353221+00:00"} {"global_step": 232053, "acc_step": 0, "speed/wps": 5528.826348044918, "speed/FLOPS": 244345825484960.66, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04851875454187393, "optim/lr": 2.4646119956511115e-05, "optim/total_tokens": 1946601652224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.288304328918457, "created_at": "2025-06-03T05:17:48.323647+00:00"} {"global_step": 232054, "acc_step": 0, "speed/wps": 5522.642598545321, "speed/FLOPS": 244072535408377.66, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042296018451452255, "optim/lr": 2.464257273141657e-05, "optim/total_tokens": 1946610040832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3024377822875977, "created_at": "2025-06-03T05:17:51.294394+00:00"} {"global_step": 232055, "acc_step": 0, "speed/wps": 5528.060097983397, "speed/FLOPS": 244311961154264.78, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04863434657454491, "optim/lr": 2.4639025506322022e-05, "optim/total_tokens": 1946618429440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2830055952072144, "created_at": "2025-06-03T05:17:54.263836+00:00"} {"global_step": 232056, "acc_step": 0, "speed/wps": 5530.403070069884, "speed/FLOPS": 244415508528069.22, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 190.87, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04214610531926155, "optim/lr": 2.4635478281227476e-05, "optim/total_tokens": 1946626818048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.280415415763855, "created_at": "2025-06-03T05:17:57.230697+00:00"} {"global_step": 232057, "acc_step": 0, "speed/wps": 5523.335057713468, "speed/FLOPS": 244103138559282.44, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.050262827426195145, "optim/lr": 2.463193105613315e-05, "optim/total_tokens": 1946635206656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3081002235412598, "created_at": "2025-06-03T05:18:00.202681+00:00"} {"global_step": 232058, "acc_step": 0, "speed/wps": 5521.441041952185, "speed/FLOPS": 244019432757085.22, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043364282697439194, "optim/lr": 2.4628383831038603e-05, "optim/total_tokens": 1946643595264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2797658443450928, "created_at": "2025-06-03T05:18:03.174040+00:00"} {"global_step": 232059, "acc_step": 0, "speed/wps": 5512.460212882297, "speed/FLOPS": 243622526080246.47, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.73 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.73, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04763945937156677, "optim/lr": 2.4624836605944057e-05, "optim/total_tokens": 1946651983872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2831472158432007, "created_at": "2025-06-03T05:18:06.150148+00:00"} {"global_step": 232060, "acc_step": 0, "speed/wps": 5524.221045525132, "speed/FLOPS": 244142294685661.25, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04250487685203552, "optim/lr": 2.462128938084951e-05, "optim/total_tokens": 1946660372480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2940893173217773, "created_at": "2025-06-03T05:18:09.120396+00:00"} {"global_step": 232061, "acc_step": 0, "speed/wps": 5521.4024295824365, "speed/FLOPS": 244017726287978.38, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04715375229716301, "optim/lr": 2.4617742155755184e-05, "optim/total_tokens": 1946668761088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.284636378288269, "created_at": "2025-06-03T05:18:12.095831+00:00"} {"global_step": 232062, "acc_step": 0, "speed/wps": 5518.428220484734, "speed/FLOPS": 243886281469242.12, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04194941371679306, "optim/lr": 2.4614194930660638e-05, "optim/total_tokens": 1946677149696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2867238521575928, "created_at": "2025-06-03T05:18:15.073699+00:00"} {"global_step": 232063, "acc_step": 0, "speed/wps": 5516.9360677834675, "speed/FLOPS": 243820335957376.0, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04639550670981407, "optim/lr": 2.461064770556609e-05, "optim/total_tokens": 1946685538304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.29643976688385, "created_at": "2025-06-03T05:18:18.050406+00:00"} {"global_step": 232064, "acc_step": 0, "speed/wps": 5532.22997042468, "speed/FLOPS": 244496248172827.5, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 190.86, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04127871245145798, "optim/lr": 2.4607100480471545e-05, "optim/total_tokens": 1946693926912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.3053252696990967, "created_at": "2025-06-03T05:18:21.016408+00:00"} {"global_step": 232065, "acc_step": 0, "speed/wps": 5519.127226991991, "speed/FLOPS": 243917173979023.22, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04828318953514099, "optim/lr": 2.460355325537722e-05, "optim/total_tokens": 1946702315520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2928969860076904, "created_at": "2025-06-03T05:18:23.993249+00:00"} {"global_step": 232066, "acc_step": 0, "speed/wps": 5516.236366031756, "speed/FLOPS": 243789412721348.6, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04286349564790726, "optim/lr": 2.4600006030282673e-05, "optim/total_tokens": 1946710704128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3003919124603271, "created_at": "2025-06-03T05:18:26.967529+00:00"} {"global_step": 232067, "acc_step": 0, "speed/wps": 5516.6128727194, "speed/FLOPS": 243806052389806.53, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046630386263132095, "optim/lr": 2.4596458805188126e-05, "optim/total_tokens": 1946719092736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.306017518043518, "created_at": "2025-06-03T05:18:29.941185+00:00"} {"global_step": 232068, "acc_step": 0, "speed/wps": 5534.4816715941815, "speed/FLOPS": 244595761839268.1, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 190.79, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0438261516392231, "optim/lr": 2.459291158009358e-05, "optim/total_tokens": 1946727481344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2901982069015503, "created_at": "2025-06-03T05:18:32.905336+00:00"} {"global_step": 232069, "acc_step": 0, "speed/wps": 5528.977078106971, "speed/FLOPS": 244352486982197.0, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044183406978845596, "optim/lr": 2.4589364354999254e-05, "optim/total_tokens": 1946735869952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2923789024353027, "created_at": "2025-06-03T05:18:35.876130+00:00"} {"global_step": 232070, "acc_step": 0, "speed/wps": 5530.487074572675, "speed/FLOPS": 244419221097118.56, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 190.92, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04332886263728142, "optim/lr": 2.4585817129904707e-05, "optim/total_tokens": 1946744258560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2886724472045898, "created_at": "2025-06-03T05:18:38.842545+00:00"} {"global_step": 232071, "acc_step": 0, "speed/wps": 5512.35143185776, "speed/FLOPS": 243617718515753.7, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045874036848545074, "optim/lr": 2.458226990481016e-05, "optim/total_tokens": 1946752647168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2869772911071777, "created_at": "2025-06-03T05:18:41.819262+00:00"} {"global_step": 232072, "acc_step": 0, "speed/wps": 5517.151251999657, "speed/FLOPS": 243829845998318.9, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04334175959229469, "optim/lr": 2.4578722679715615e-05, "optim/total_tokens": 1946761035776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2950806617736816, "created_at": "2025-06-03T05:18:44.793055+00:00"} {"global_step": 232073, "acc_step": 0, "speed/wps": 5516.8826889239635, "speed/FLOPS": 243817976885003.72, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.049344729632139206, "optim/lr": 2.4575175454621292e-05, "optim/total_tokens": 1946769424384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.309206485748291, "created_at": "2025-06-03T05:18:47.767105+00:00"} {"global_step": 232074, "acc_step": 0, "speed/wps": 5518.255938672093, "speed/FLOPS": 243878667494941.62, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0519489124417305, "optim/lr": 2.4571628229526742e-05, "optim/total_tokens": 1946777812992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2792377471923828, "created_at": "2025-06-03T05:18:50.739685+00:00"} {"global_step": 232075, "acc_step": 0, "speed/wps": 5507.45355537248, "speed/FLOPS": 243401257444708.78, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.72 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.72, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042510196566581726, "optim/lr": 2.4568081004432196e-05, "optim/total_tokens": 1946786201600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.28603994846344, "created_at": "2025-06-03T05:18:53.718386+00:00"} {"global_step": 232076, "acc_step": 0, "speed/wps": 5521.2420713784495, "speed/FLOPS": 244010639276149.84, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.047710876911878586, "optim/lr": 2.4564533779337873e-05, "optim/total_tokens": 1946794590208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3090404272079468, "created_at": "2025-06-03T05:18:56.689763+00:00"} {"global_step": 232077, "acc_step": 0, "speed/wps": 5514.38824610313, "speed/FLOPS": 243707735280038.62, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04308099299669266, "optim/lr": 2.4560986554243326e-05, "optim/total_tokens": 1946802978816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.293242335319519, "created_at": "2025-06-03T05:18:59.666242+00:00"} {"global_step": 232078, "acc_step": 0, "speed/wps": 5518.478686406594, "speed/FLOPS": 243888511804680.3, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04700978472828865, "optim/lr": 2.455743932914878e-05, "optim/total_tokens": 1946811367424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2837796211242676, "created_at": "2025-06-03T05:19:02.638910+00:00"} {"global_step": 232079, "acc_step": 0, "speed/wps": 5539.618472003097, "speed/FLOPS": 244822782124814.2, "speed/curr_iter_time": 2.9561, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9561, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 190.57, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042931023985147476, "optim/lr": 2.455389210405423e-05, "optim/total_tokens": 1946819756032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2725439071655273, "created_at": "2025-06-03T05:19:05.605849+00:00"} {"global_step": 232080, "acc_step": 0, "speed/wps": 5519.684752530844, "speed/FLOPS": 243941813754166.12, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05231234058737755, "optim/lr": 2.4550344878959907e-05, "optim/total_tokens": 1946828144640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3088029623031616, "created_at": "2025-06-03T05:19:08.582286+00:00"} {"global_step": 232081, "acc_step": 0, "speed/wps": 5529.182365236849, "speed/FLOPS": 244361559622582.84, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 190.98, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04300519451498985, "optim/lr": 2.454679765386536e-05, "optim/total_tokens": 1946836533248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2921470403671265, "created_at": "2025-06-03T05:19:11.550216+00:00"} {"global_step": 232082, "acc_step": 0, "speed/wps": 5520.036044348418, "speed/FLOPS": 243957339054428.38, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04930170997977257, "optim/lr": 2.4543250428770815e-05, "optim/total_tokens": 1946844921856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.298909306526184, "created_at": "2025-06-03T05:19:14.521893+00:00"} {"global_step": 232083, "acc_step": 0, "speed/wps": 5512.390032603038, "speed/FLOPS": 243619424471118.44, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04400663450360298, "optim/lr": 2.4539703203676268e-05, "optim/total_tokens": 1946853310464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.3052172660827637, "created_at": "2025-06-03T05:19:17.504044+00:00"} {"global_step": 232084, "acc_step": 0, "speed/wps": 5521.015708355454, "speed/FLOPS": 244000635189164.4, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04418473318219185, "optim/lr": 2.4536155978581942e-05, "optim/total_tokens": 1946861699072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2888298034667969, "created_at": "2025-06-03T05:19:20.479984+00:00"} {"global_step": 232085, "acc_step": 0, "speed/wps": 5522.922589329474, "speed/FLOPS": 244084909567914.5, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04916438087821007, "optim/lr": 2.4532608753487396e-05, "optim/total_tokens": 1946870087680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.300171971321106, "created_at": "2025-06-03T05:19:23.454201+00:00"} {"global_step": 232086, "acc_step": 0, "speed/wps": 5509.274064693682, "speed/FLOPS": 243481714638494.47, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04792023450136185, "optim/lr": 2.452906152839285e-05, "optim/total_tokens": 1946878476288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2977622747421265, "created_at": "2025-06-03T05:19:26.436016+00:00"} {"global_step": 232087, "acc_step": 0, "speed/wps": 5523.712435230599, "speed/FLOPS": 244119816713946.4, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0485222190618515, "optim/lr": 2.4525514303298303e-05, "optim/total_tokens": 1946886864896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.298363447189331, "created_at": "2025-06-03T05:19:29.408013+00:00"} {"global_step": 232088, "acc_step": 0, "speed/wps": 5531.289564000529, "speed/FLOPS": 244454687022316.47, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04918422922492027, "optim/lr": 2.4521967078203977e-05, "optim/total_tokens": 1946895253504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2967289686203003, "created_at": "2025-06-03T05:19:32.374239+00:00"} {"global_step": 232089, "acc_step": 0, "speed/wps": 5512.580162289632, "speed/FLOPS": 243627827230093.97, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043591782450675964, "optim/lr": 2.451841985310943e-05, "optim/total_tokens": 1946903642112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.28235924243927, "created_at": "2025-06-03T05:19:35.353166+00:00"} {"global_step": 232090, "acc_step": 0, "speed/wps": 5521.598507129348, "speed/FLOPS": 244026391911936.0, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.25, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043516892939805984, "optim/lr": 2.4514872628014884e-05, "optim/total_tokens": 1946912030720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2908121347427368, "created_at": "2025-06-03T05:19:38.327046+00:00"} {"global_step": 232091, "acc_step": 0, "speed/wps": 5512.109589714037, "speed/FLOPS": 243607030330861.4, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04418075829744339, "optim/lr": 2.4511325402920338e-05, "optim/total_tokens": 1946920419328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.290846347808838, "created_at": "2025-06-03T05:19:41.307238+00:00"} {"global_step": 232092, "acc_step": 0, "speed/wps": 5515.331381727325, "speed/FLOPS": 243749417047222.3, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046112313866615295, "optim/lr": 2.450777817782601e-05, "optim/total_tokens": 1946928807936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2894046306610107, "created_at": "2025-06-03T05:19:44.284585+00:00"} {"global_step": 232093, "acc_step": 0, "speed/wps": 5527.5926655806215, "speed/FLOPS": 244291303034598.03, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04210584983229637, "optim/lr": 2.4504230952731465e-05, "optim/total_tokens": 1946937196544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2898714542388916, "created_at": "2025-06-03T05:19:47.252733+00:00"} {"global_step": 232094, "acc_step": 0, "speed/wps": 5529.114930384612, "speed/FLOPS": 244358579347276.8, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04911860451102257, "optim/lr": 2.450068372763692e-05, "optim/total_tokens": 1946945585152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3042901754379272, "created_at": "2025-06-03T05:19:50.222856+00:00"} {"global_step": 232095, "acc_step": 0, "speed/wps": 5525.096713973501, "speed/FLOPS": 244180994749001.75, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04156922921538353, "optim/lr": 2.4497136502542372e-05, "optim/total_tokens": 1946953973760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2687898874282837, "created_at": "2025-06-03T05:19:53.196267+00:00"} {"global_step": 232096, "acc_step": 0, "speed/wps": 5525.5023907614, "speed/FLOPS": 244198923586584.88, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044761113822460175, "optim/lr": 2.4493589277448046e-05, "optim/total_tokens": 1946962362368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2886948585510254, "created_at": "2025-06-03T05:19:56.169551+00:00"} {"global_step": 232097, "acc_step": 0, "speed/wps": 5521.633448570502, "speed/FLOPS": 244027936144788.47, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.25, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04321436583995819, "optim/lr": 2.44900420523535e-05, "optim/total_tokens": 1946970750976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3008925914764404, "created_at": "2025-06-03T05:19:59.140421+00:00"} {"global_step": 232098, "acc_step": 0, "speed/wps": 5512.293759745052, "speed/FLOPS": 243615169703564.62, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04354686290025711, "optim/lr": 2.4486494827258953e-05, "optim/total_tokens": 1946979139584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2968140840530396, "created_at": "2025-06-03T05:20:02.116001+00:00"} {"global_step": 232099, "acc_step": 0, "speed/wps": 5520.556774954111, "speed/FLOPS": 243980352681859.12, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0004, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.25, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042741809040308, "optim/lr": 2.4482947602164407e-05, "optim/total_tokens": 1946987528192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2874139547348022, "created_at": "2025-06-03T05:20:05.087799+00:00"} {"global_step": 232100, "acc_step": 0, "speed/wps": 5513.162090646757, "speed/FLOPS": 243653545484899.53, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04463120922446251, "optim/lr": 2.447940037707008e-05, "optim/total_tokens": 1946995916800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2943750619888306, "created_at": "2025-06-03T05:20:08.067927+00:00"} {"global_step": 232101, "acc_step": 0, "speed/wps": 5505.491537561665, "speed/FLOPS": 243314546299988.28, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.041623737663030624, "optim/lr": 2.4475853151975534e-05, "optim/total_tokens": 1947004305408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3010755777359009, "created_at": "2025-06-03T05:20:11.047462+00:00"} {"global_step": 232102, "acc_step": 0, "speed/wps": 5510.60146821861, "speed/FLOPS": 243540379080029.12, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.048241809010505676, "optim/lr": 2.4472305926880988e-05, "optim/total_tokens": 1947012694016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2982947826385498, "created_at": "2025-06-03T05:20:14.025005+00:00"} {"global_step": 232103, "acc_step": 0, "speed/wps": 5521.6750208265885, "speed/FLOPS": 244029773425721.4, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04239688813686371, "optim/lr": 2.4468758701786665e-05, "optim/total_tokens": 1947021082624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2918423414230347, "created_at": "2025-06-03T05:20:17.000545+00:00"} {"global_step": 232104, "acc_step": 0, "speed/wps": 5516.804309356815, "speed/FLOPS": 243814512909318.72, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.049209073185920715, "optim/lr": 2.446521147669212e-05, "optim/total_tokens": 1947029471232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.295789361000061, "created_at": "2025-06-03T05:20:19.974047+00:00"} {"global_step": 232105, "acc_step": 0, "speed/wps": 5516.6104504045115, "speed/FLOPS": 243805945335887.0, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04356260225176811, "optim/lr": 2.4461664251597572e-05, "optim/total_tokens": 1947037859840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2892811298370361, "created_at": "2025-06-03T05:20:22.951605+00:00"} {"global_step": 232106, "acc_step": 0, "speed/wps": 5506.773669117314, "speed/FLOPS": 243371209952203.75, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0021, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05199727043509483, "optim/lr": 2.4458117026503023e-05, "optim/total_tokens": 1947046248448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2840418815612793, "created_at": "2025-06-03T05:20:25.930507+00:00"} {"global_step": 232107, "acc_step": 0, "speed/wps": 5506.283597191604, "speed/FLOPS": 243349551281502.88, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.71, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04251498728990555, "optim/lr": 2.44545698014087e-05, "optim/total_tokens": 1947054637056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.281721591949463, "created_at": "2025-06-03T05:20:28.909502+00:00"} {"global_step": 232108, "acc_step": 0, "speed/wps": 5519.209536087461, "speed/FLOPS": 243920811619746.84, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04793418198823929, "optim/lr": 2.4451022576314153e-05, "optim/total_tokens": 1947063025664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.309964895248413, "created_at": "2025-06-03T05:20:31.883561+00:00"} {"global_step": 232109, "acc_step": 0, "speed/wps": 5510.846353571649, "speed/FLOPS": 243551201759196.6, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.61, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04181792587041855, "optim/lr": 2.4447475351219607e-05, "optim/total_tokens": 1947071414272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2921605110168457, "created_at": "2025-06-03T05:20:34.860595+00:00"} {"global_step": 232110, "acc_step": 0, "speed/wps": 5508.8464732765915, "speed/FLOPS": 243462817286470.34, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045466240495443344, "optim/lr": 2.444392812612506e-05, "optim/total_tokens": 1947079802880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2853955030441284, "created_at": "2025-06-03T05:20:37.838789+00:00"} {"global_step": 232111, "acc_step": 0, "speed/wps": 5520.152510378178, "speed/FLOPS": 243962486256816.6, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.042129095643758774, "optim/lr": 2.4440380901030734e-05, "optim/total_tokens": 1947088191488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2963916063308716, "created_at": "2025-06-03T05:20:40.814553+00:00"} {"global_step": 232112, "acc_step": 0, "speed/wps": 5526.835413459052, "speed/FLOPS": 244257836366792.38, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05089897662401199, "optim/lr": 2.4436833675936188e-05, "optim/total_tokens": 1947096580096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2811002731323242, "created_at": "2025-06-03T05:20:43.787488+00:00"} {"global_step": 232113, "acc_step": 0, "speed/wps": 5504.789207189296, "speed/FLOPS": 243283506892382.28, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.044261541217565536, "optim/lr": 2.443328645084164e-05, "optim/total_tokens": 1947104968704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2919756174087524, "created_at": "2025-06-03T05:20:46.771351+00:00"} {"global_step": 232114, "acc_step": 0, "speed/wps": 5507.661411044434, "speed/FLOPS": 243410443601507.38, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04891183599829674, "optim/lr": 2.4429739225747095e-05, "optim/total_tokens": 1947113357312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2926714420318604, "created_at": "2025-06-03T05:20:49.754822+00:00"} {"global_step": 232115, "acc_step": 0, "speed/wps": 5490.160702782852, "speed/FLOPS": 242637001873090.66, "speed/curr_iter_time": 2.9833, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9833, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04674730822443962, "optim/lr": 2.442619200065277e-05, "optim/total_tokens": 1947121745920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2915198802947998, "created_at": "2025-06-03T05:20:52.747172+00:00"} {"global_step": 232116, "acc_step": 0, "speed/wps": 5488.07830681672, "speed/FLOPS": 242544970630056.4, "speed/curr_iter_time": 2.9838, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9838, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.71 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.71, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0492100715637207, "optim/lr": 2.4422644775558223e-05, "optim/total_tokens": 1947130134528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2948734760284424, "created_at": "2025-06-03T05:20:55.743125+00:00"} {"global_step": 232117, "acc_step": 0, "speed/wps": 5497.523222735632, "speed/FLOPS": 242962387570210.2, "speed/curr_iter_time": 2.9794, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9794, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.7 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.7, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04678494483232498, "optim/lr": 2.4419097550463676e-05, "optim/total_tokens": 1947138523136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2992037534713745, "created_at": "2025-06-03T05:20:58.728273+00:00"} {"global_step": 232118, "acc_step": 0, "speed/wps": 5510.319033419657, "speed/FLOPS": 243527896907547.75, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05410558357834816, "optim/lr": 2.441555032536913e-05, "optim/total_tokens": 1947146911744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.287076473236084, "created_at": "2025-06-03T05:21:01.706519+00:00"} {"global_step": 232119, "acc_step": 0, "speed/wps": 5514.5374989285465, "speed/FLOPS": 243714331490976.84, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04194061830639839, "optim/lr": 2.4412003100274804e-05, "optim/total_tokens": 1947155300352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2881449460983276, "created_at": "2025-06-03T05:21:04.686012+00:00"} {"global_step": 232120, "acc_step": 0, "speed/wps": 5520.181178700458, "speed/FLOPS": 243963753249923.6, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04521369934082031, "optim/lr": 2.4408455875180257e-05, "optim/total_tokens": 1947163688960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2987333536148071, "created_at": "2025-06-03T05:21:07.662119+00:00"} {"global_step": 232121, "acc_step": 0, "speed/wps": 5511.611441632012, "speed/FLOPS": 243585014735388.97, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.041973017156124115, "optim/lr": 2.440490865008571e-05, "optim/total_tokens": 1947172077568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3109904527664185, "created_at": "2025-06-03T05:21:10.639694+00:00"} {"global_step": 232122, "acc_step": 0, "speed/wps": 5512.112882851748, "speed/FLOPS": 243607175870692.44, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043292831629514694, "optim/lr": 2.4401361424991165e-05, "optim/total_tokens": 1947180466176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.291243076324463, "created_at": "2025-06-03T05:21:13.619257+00:00"} {"global_step": 232123, "acc_step": 0, "speed/wps": 5509.0334391788665, "speed/FLOPS": 243471080222372.66, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04176639765501022, "optim/lr": 2.439781419989684e-05, "optim/total_tokens": 1947188854784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2895219326019287, "created_at": "2025-06-03T05:21:16.597691+00:00"} {"global_step": 232124, "acc_step": 0, "speed/wps": 5511.463705624045, "speed/FLOPS": 243578485560018.25, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043697334825992584, "optim/lr": 2.4394266974802292e-05, "optim/total_tokens": 1947197243392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.293764352798462, "created_at": "2025-06-03T05:21:19.574270+00:00"} {"global_step": 232125, "acc_step": 0, "speed/wps": 5512.6877832859345, "speed/FLOPS": 243632583527276.3, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04268861562013626, "optim/lr": 2.4390719749707746e-05, "optim/total_tokens": 1947205632000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2839552164077759, "created_at": "2025-06-03T05:21:22.554811+00:00"} {"global_step": 232126, "acc_step": 0, "speed/wps": 5498.395899823466, "speed/FLOPS": 243000955430726.2, "speed/curr_iter_time": 2.978, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.978, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046574316918849945, "optim/lr": 2.43871725246132e-05, "optim/total_tokens": 1947214020608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2971361875534058, "created_at": "2025-06-03T05:21:25.538949+00:00"} {"global_step": 232127, "acc_step": 0, "speed/wps": 5521.832834722495, "speed/FLOPS": 244036747992155.75, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.27, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04634920135140419, "optim/lr": 2.4383625299518873e-05, "optim/total_tokens": 1947222409216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3035733699798584, "created_at": "2025-06-03T05:21:28.513141+00:00"} {"global_step": 232128, "acc_step": 0, "speed/wps": 5530.38619636887, "speed/FLOPS": 244414762796851.8, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.65 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.65, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05417758971452713, "optim/lr": 2.4380078074424327e-05, "optim/total_tokens": 1947230797824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.285685658454895, "created_at": "2025-06-03T05:21:31.483080+00:00"} {"global_step": 232129, "acc_step": 0, "speed/wps": 5517.947020802936, "speed/FLOPS": 243865014906309.88, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04237223416566849, "optim/lr": 2.437653084932978e-05, "optim/total_tokens": 1947239186432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.269887924194336, "created_at": "2025-06-03T05:21:34.461899+00:00"} {"global_step": 232130, "acc_step": 0, "speed/wps": 5514.148219748765, "speed/FLOPS": 243697127343741.97, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04899287968873978, "optim/lr": 2.4372983624235458e-05, "optim/total_tokens": 1947247575040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.305321455001831, "created_at": "2025-06-03T05:21:37.437757+00:00"} {"global_step": 232131, "acc_step": 0, "speed/wps": 5519.54538591342, "speed/FLOPS": 243935654463019.03, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0439215749502182, "optim/lr": 2.436943639914091e-05, "optim/total_tokens": 1947255963648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2983423471450806, "created_at": "2025-06-03T05:21:40.414783+00:00"} {"global_step": 232132, "acc_step": 0, "speed/wps": 5524.808435536279, "speed/FLOPS": 244168254317619.34, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.046174485236406326, "optim/lr": 2.436588917404636e-05, "optim/total_tokens": 1947264352256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2702544927597046, "created_at": "2025-06-03T05:21:43.385101+00:00"} {"global_step": 232133, "acc_step": 0, "speed/wps": 5507.232270441003, "speed/FLOPS": 243391477783376.44, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0447867177426815, "optim/lr": 2.4362341948951815e-05, "optim/total_tokens": 1947272740864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2975502014160156, "created_at": "2025-06-03T05:21:46.365168+00:00"} {"global_step": 232134, "acc_step": 0, "speed/wps": 5508.195676103276, "speed/FLOPS": 243434055382491.72, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04509914293885231, "optim/lr": 2.4358794723857492e-05, "optim/total_tokens": 1947281129472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.291407585144043, "created_at": "2025-06-03T05:21:49.344364+00:00"} {"global_step": 232135, "acc_step": 0, "speed/wps": 5517.96937920122, "speed/FLOPS": 243866003033073.4, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04745786637067795, "optim/lr": 2.4355247498762946e-05, "optim/total_tokens": 1947289518080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2915302515029907, "created_at": "2025-06-03T05:21:52.321937+00:00"} {"global_step": 232136, "acc_step": 0, "speed/wps": 5518.385123165838, "speed/FLOPS": 243884376788339.0, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.051442213356494904, "optim/lr": 2.43517002736684e-05, "optim/total_tokens": 1947297906688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.292742133140564, "created_at": "2025-06-03T05:21:55.295608+00:00"} {"global_step": 232137, "acc_step": 0, "speed/wps": 5504.141193660232, "speed/FLOPS": 243254868011231.56, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.045512743294239044, "optim/lr": 2.434815304857385e-05, "optim/total_tokens": 1947306295296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3061338663101196, "created_at": "2025-06-03T05:21:58.276621+00:00"} {"global_step": 232138, "acc_step": 0, "speed/wps": 5514.008477984075, "speed/FLOPS": 243690951473005.88, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05408423766493797, "optim/lr": 2.4344605823479527e-05, "optim/total_tokens": 1947314683904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2982302904129028, "created_at": "2025-06-03T05:22:01.252144+00:00"} {"global_step": 232139, "acc_step": 0, "speed/wps": 5514.621150489896, "speed/FLOPS": 243718028461820.97, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0434785895049572, "optim/lr": 2.434105859838498e-05, "optim/total_tokens": 1947323072512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2860487699508667, "created_at": "2025-06-03T05:22:04.227363+00:00"} {"global_step": 232140, "acc_step": 0, "speed/wps": 5512.104886842145, "speed/FLOPS": 243606822487995.28, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.050812747329473495, "optim/lr": 2.4337511373290434e-05, "optim/total_tokens": 1947331461120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2949150800704956, "created_at": "2025-06-03T05:22:07.207619+00:00"} {"global_step": 232141, "acc_step": 0, "speed/wps": 5514.364400815378, "speed/FLOPS": 243706681440371.25, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04649784043431282, "optim/lr": 2.4333964148195888e-05, "optim/total_tokens": 1947339849728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2969081401824951, "created_at": "2025-06-03T05:22:10.182980+00:00"} {"global_step": 232142, "acc_step": 0, "speed/wps": 5490.014839618439, "speed/FLOPS": 242630555467818.94, "speed/curr_iter_time": 2.9835, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9835, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05137242376804352, "optim/lr": 2.433041692310156e-05, "optim/total_tokens": 1947348238336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.284848928451538, "created_at": "2025-06-03T05:22:13.171676+00:00"} {"global_step": 232143, "acc_step": 0, "speed/wps": 5503.776971715672, "speed/FLOPS": 243238771265538.94, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04644833505153656, "optim/lr": 2.4326869698007015e-05, "optim/total_tokens": 1947356626944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3108311891555786, "created_at": "2025-06-03T05:22:16.153834+00:00"} {"global_step": 232144, "acc_step": 0, "speed/wps": 5486.206788713577, "speed/FLOPS": 242462259109195.53, "speed/curr_iter_time": 2.9856, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9856, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.69 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.69, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.0474686361849308, "optim/lr": 2.432332247291247e-05, "optim/total_tokens": 1947365015552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2965290546417236, "created_at": "2025-06-03T05:22:19.150580+00:00"} {"global_step": 232145, "acc_step": 0, "speed/wps": 5495.0823797422945, "speed/FLOPS": 242854514803271.7, "speed/curr_iter_time": 2.9807, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9807, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.68 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.68, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04660243168473244, "optim/lr": 2.4319775247817922e-05, "optim/total_tokens": 1947373404160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.294397234916687, "created_at": "2025-06-03T05:22:22.137111+00:00"} {"global_step": 232146, "acc_step": 0, "speed/wps": 5496.973529303393, "speed/FLOPS": 242938093934091.28, "speed/curr_iter_time": 2.9798, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9798, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04520460590720177, "optim/lr": 2.4316228022723596e-05, "optim/total_tokens": 1947381792768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2753881216049194, "created_at": "2025-06-03T05:22:25.126073+00:00"} {"global_step": 232147, "acc_step": 0, "speed/wps": 5498.540704477348, "speed/FLOPS": 243007355055250.4, "speed/curr_iter_time": 2.978, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.978, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04418903589248657, "optim/lr": 2.431268079762905e-05, "optim/total_tokens": 1947390181376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2983310222625732, "created_at": "2025-06-03T05:22:28.110774+00:00"} {"global_step": 232148, "acc_step": 0, "speed/wps": 5505.79800950619, "speed/FLOPS": 243328090791270.7, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04370376467704773, "optim/lr": 2.4309133572534503e-05, "optim/total_tokens": 1947398569984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2872323989868164, "created_at": "2025-06-03T05:22:31.091252+00:00"} {"global_step": 232149, "acc_step": 0, "speed/wps": 5506.815722940772, "speed/FLOPS": 243373068515949.6, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04394912347197533, "optim/lr": 2.4305586347439957e-05, "optim/total_tokens": 1947406958592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3006720542907715, "created_at": "2025-06-03T05:22:34.073605+00:00"} {"global_step": 232150, "acc_step": 0, "speed/wps": 5493.80445192186, "speed/FLOPS": 242798036934636.03, "speed/curr_iter_time": 2.9807, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9807, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.67 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.67, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04310963302850723, "optim/lr": 2.430203912234563e-05, "optim/total_tokens": 1947415347200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2743674516677856, "created_at": "2025-06-03T05:22:37.060336+00:00"} {"global_step": 232151, "acc_step": 0, "speed/wps": 5501.916943602256, "speed/FLOPS": 243156567543412.88, "speed/curr_iter_time": 2.9771, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9771, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04641887918114662, "optim/lr": 2.4298491897251084e-05, "optim/total_tokens": 1947423735808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2970516681671143, "created_at": "2025-06-03T05:22:40.046256+00:00"} {"global_step": 232152, "acc_step": 0, "speed/wps": 5516.578957044757, "speed/FLOPS": 243804553490583.47, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.65 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.65, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043581753969192505, "optim/lr": 2.4294944672156538e-05, "optim/total_tokens": 1947432124416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2742359638214111, "created_at": "2025-06-03T05:22:43.020344+00:00"} {"global_step": 232153, "acc_step": 0, "speed/wps": 5520.283660546604, "speed/FLOPS": 243968282422973.6, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.05079972743988037, "optim/lr": 2.429139744706199e-05, "optim/total_tokens": 1947440513024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2957897186279297, "created_at": "2025-06-03T05:22:45.992494+00:00"} {"global_step": 232154, "acc_step": 0, "speed/wps": 5513.8967168911895, "speed/FLOPS": 243686012204745.44, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.65 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.65, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04414163529872894, "optim/lr": 2.4287850221967665e-05, "optim/total_tokens": 1947448901632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.279564380645752, "created_at": "2025-06-03T05:22:48.968029+00:00"} {"global_step": 232155, "acc_step": 0, "speed/wps": 5530.551989226813, "speed/FLOPS": 244422089992568.16, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.047704264521598816, "optim/lr": 2.428430299687312e-05, "optim/total_tokens": 1947457290240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3096526861190796, "created_at": "2025-06-03T05:22:51.934870+00:00"} {"global_step": 232156, "acc_step": 0, "speed/wps": 5512.04982860527, "speed/FLOPS": 243604389195739.0, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.65 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.65, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04321865364909172, "optim/lr": 2.4280755771778573e-05, "optim/total_tokens": 1947465678848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2999426126480103, "created_at": "2025-06-03T05:22:54.912789+00:00"} {"global_step": 232157, "acc_step": 0, "speed/wps": 5523.419199671717, "speed/FLOPS": 244106857203159.47, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04496267810463905, "optim/lr": 2.427720854668425e-05, "optim/total_tokens": 1947474067456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2985386848449707, "created_at": "2025-06-03T05:22:57.883592+00:00"} {"global_step": 232158, "acc_step": 0, "speed/wps": 5516.4951479085985, "speed/FLOPS": 243800849555739.3, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04301205649971962, "optim/lr": 2.42736613215897e-05, "optim/total_tokens": 1947482456064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2841782569885254, "created_at": "2025-06-03T05:23:00.858389+00:00"} {"global_step": 232159, "acc_step": 0, "speed/wps": 5519.862555412488, "speed/FLOPS": 243949671731457.16, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04458176717162132, "optim/lr": 2.4270114096495154e-05, "optim/total_tokens": 1947490844672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2960665225982666, "created_at": "2025-06-03T05:23:03.835820+00:00"} {"global_step": 232160, "acc_step": 0, "speed/wps": 5513.974462977028, "speed/FLOPS": 243689448183799.0, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04294687509536743, "optim/lr": 2.4266566871400607e-05, "optim/total_tokens": 1947499233280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2899576425552368, "created_at": "2025-06-03T05:23:06.812133+00:00"} {"global_step": 232161, "acc_step": 0, "speed/wps": 5530.621740329056, "speed/FLOPS": 244425172634268.78, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04279337450861931, "optim/lr": 2.4263019646306285e-05, "optim/total_tokens": 1947507621888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2885754108428955, "created_at": "2025-06-03T05:23:09.782041+00:00"} {"global_step": 232162, "acc_step": 0, "speed/wps": 5525.222694954991, "speed/FLOPS": 244186562463554.5, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04239702224731445, "optim/lr": 2.4259472421211738e-05, "optim/total_tokens": 1947516010496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3039618730545044, "created_at": "2025-06-03T05:23:12.754923+00:00"} {"global_step": 232163, "acc_step": 0, "speed/wps": 5523.928195228381, "speed/FLOPS": 244129352201488.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04340152069926262, "optim/lr": 2.4255925196117192e-05, "optim/total_tokens": 1947524399104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2813702821731567, "created_at": "2025-06-03T05:23:15.730717+00:00"} {"global_step": 232164, "acc_step": 0, "speed/wps": 5511.408562207737, "speed/FLOPS": 243576048503267.03, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.66, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04289216548204422, "optim/lr": 2.4252377971022642e-05, "optim/total_tokens": 1947532787712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2836872339248657, "created_at": "2025-06-03T05:23:18.708069+00:00"} {"global_step": 232165, "acc_step": 0, "speed/wps": 5519.516932869043, "speed/FLOPS": 243934396984093.4, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042422596365213394, "optim/lr": 2.424883074592832e-05, "optim/total_tokens": 1947541176320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2934935092926025, "created_at": "2025-06-03T05:23:21.680653+00:00"} {"global_step": 232166, "acc_step": 0, "speed/wps": 5527.964842078635, "speed/FLOPS": 244307751330838.22, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04413736239075661, "optim/lr": 2.4245283520833773e-05, "optim/total_tokens": 1947549564928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2974179983139038, "created_at": "2025-06-03T05:23:24.652434+00:00"} {"global_step": 232167, "acc_step": 0, "speed/wps": 5508.750935230416, "speed/FLOPS": 243458594993837.44, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04295036569237709, "optim/lr": 2.4241736295739226e-05, "optim/total_tokens": 1947557953536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.283634901046753, "created_at": "2025-06-03T05:23:27.635351+00:00"} {"global_step": 232168, "acc_step": 0, "speed/wps": 5494.423672336872, "speed/FLOPS": 242825403307522.16, "speed/curr_iter_time": 2.9812, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9812, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.66 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.66, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04252135753631592, "optim/lr": 2.423818907064468e-05, "optim/total_tokens": 1947566342144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3033372163772583, "created_at": "2025-06-03T05:23:30.628344+00:00"} {"global_step": 232169, "acc_step": 0, "speed/wps": 5509.992773747208, "speed/FLOPS": 243513477899973.9, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.04287151247262955, "optim/lr": 2.4234641845550354e-05, "optim/total_tokens": 1947574730752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2875300645828247, "created_at": "2025-06-03T05:23:33.606468+00:00"} {"global_step": 232170, "acc_step": 0, "speed/wps": 5520.719838054101, "speed/FLOPS": 243987559236246.12, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04210052266716957, "optim/lr": 2.4231094620455807e-05, "optim/total_tokens": 1947583119360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2680188417434692, "created_at": "2025-06-03T05:23:36.582521+00:00"} {"global_step": 232171, "acc_step": 0, "speed/wps": 5520.610329313809, "speed/FLOPS": 243982719510441.75, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04190943017601967, "optim/lr": 2.422754739536126e-05, "optim/total_tokens": 1947591507968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2786102294921875, "created_at": "2025-06-03T05:23:39.558719+00:00"} {"global_step": 232172, "acc_step": 0, "speed/wps": 5515.1209121641405, "speed/FLOPS": 243740115369810.44, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043175142258405685, "optim/lr": 2.4224000170266715e-05, "optim/total_tokens": 1947599896576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2830628156661987, "created_at": "2025-06-03T05:23:42.537675+00:00"} {"global_step": 232173, "acc_step": 0, "speed/wps": 5512.774782363988, "speed/FLOPS": 243636428441224.66, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04243290051817894, "optim/lr": 2.422045294517239e-05, "optim/total_tokens": 1947608285184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2798540592193604, "created_at": "2025-06-03T05:23:45.518336+00:00"} {"global_step": 232174, "acc_step": 0, "speed/wps": 5517.852239440877, "speed/FLOPS": 243860826055241.88, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04329199343919754, "optim/lr": 2.4216905720077842e-05, "optim/total_tokens": 1947616673792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2995471954345703, "created_at": "2025-06-03T05:23:48.493216+00:00"} {"global_step": 232175, "acc_step": 0, "speed/wps": 5500.5610980165975, "speed/FLOPS": 243096646108373.62, "speed/curr_iter_time": 2.9778, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9778, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.65 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.65, "speed/est_time_remaining_days": 0.24, "optim/grad_norm": 0.043286047875881195, "optim/lr": 2.4213358494983296e-05, "optim/total_tokens": 1947625062400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3116965293884277, "created_at": "2025-06-03T05:23:51.476464+00:00"} {"global_step": 232176, "acc_step": 0, "speed/wps": 5507.384883116171, "speed/FLOPS": 243398222482476.4, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04358172044157982, "optim/lr": 2.420981126988875e-05, "optim/total_tokens": 1947633451008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3000364303588867, "created_at": "2025-06-03T05:23:54.461208+00:00"} {"global_step": 232177, "acc_step": 0, "speed/wps": 5507.820772684252, "speed/FLOPS": 243417486570300.5, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.64 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.64, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04310334101319313, "optim/lr": 2.4206264044794423e-05, "optim/total_tokens": 1947641839616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2891550064086914, "created_at": "2025-06-03T05:23:57.440432+00:00"} {"global_step": 232178, "acc_step": 0, "speed/wps": 5528.1192982370585, "speed/FLOPS": 244314577502462.25, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044446419924497604, "optim/lr": 2.4202716819699877e-05, "optim/total_tokens": 1947650228224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2929143905639648, "created_at": "2025-06-03T05:24:00.408652+00:00"} {"global_step": 232179, "acc_step": 0, "speed/wps": 5509.135794344407, "speed/FLOPS": 243475603796788.34, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04567009210586548, "optim/lr": 2.419916959460533e-05, "optim/total_tokens": 1947658616832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2871094942092896, "created_at": "2025-06-03T05:24:03.387716+00:00"} {"global_step": 232180, "acc_step": 0, "speed/wps": 5520.586535861815, "speed/FLOPS": 243981667961649.53, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042090725153684616, "optim/lr": 2.4195622369510784e-05, "optim/total_tokens": 1947667005440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2929145097732544, "created_at": "2025-06-03T05:24:06.360316+00:00"} {"global_step": 232181, "acc_step": 0, "speed/wps": 5515.460171243546, "speed/FLOPS": 243755108884634.78, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043258752673864365, "optim/lr": 2.4192075144416458e-05, "optim/total_tokens": 1947675394048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2912734746932983, "created_at": "2025-06-03T05:24:09.336010+00:00"} {"global_step": 232182, "acc_step": 0, "speed/wps": 5524.3259274069305, "speed/FLOPS": 244146929928002.62, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04503101855516434, "optim/lr": 2.418852791932191e-05, "optim/total_tokens": 1947683782656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3070220947265625, "created_at": "2025-06-03T05:24:12.307227+00:00"} {"global_step": 232183, "acc_step": 0, "speed/wps": 5512.966237338936, "speed/FLOPS": 243644889771161.9, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04455578699707985, "optim/lr": 2.4184980694227365e-05, "optim/total_tokens": 1947692171264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2850383520126343, "created_at": "2025-06-03T05:24:15.283042+00:00"} {"global_step": 232184, "acc_step": 0, "speed/wps": 5511.538453273097, "speed/FLOPS": 243581789023513.2, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.61, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04557044059038162, "optim/lr": 2.4181433469133042e-05, "optim/total_tokens": 1947700559872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2959325313568115, "created_at": "2025-06-03T05:24:18.260993+00:00"} {"global_step": 232185, "acc_step": 0, "speed/wps": 5508.486852855111, "speed/FLOPS": 243446923904545.06, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042928297072649, "optim/lr": 2.4177886244038492e-05, "optim/total_tokens": 1947708948480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2985790967941284, "created_at": "2025-06-03T05:24:21.243786+00:00"} {"global_step": 232186, "acc_step": 0, "speed/wps": 5515.855314306011, "speed/FLOPS": 243772572185470.2, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05089057236909866, "optim/lr": 2.4174339018943946e-05, "optim/total_tokens": 1947717337088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.3023265600204468, "created_at": "2025-06-03T05:24:24.218760+00:00"} {"global_step": 232187, "acc_step": 0, "speed/wps": 5523.586172782785, "speed/FLOPS": 244114236560022.8, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.052610766142606735, "optim/lr": 2.41707917938494e-05, "optim/total_tokens": 1947725725696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2911714315414429, "created_at": "2025-06-03T05:24:27.189598+00:00"} {"global_step": 232188, "acc_step": 0, "speed/wps": 5517.714931747886, "speed/FLOPS": 243854757758016.16, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.049650888890028, "optim/lr": 2.4167244568755077e-05, "optim/total_tokens": 1947734114304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.287398099899292, "created_at": "2025-06-03T05:24:30.168381+00:00"} {"global_step": 232189, "acc_step": 0, "speed/wps": 5514.720558462222, "speed/FLOPS": 243722421785381.66, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0632898211479187, "optim/lr": 2.416369734366053e-05, "optim/total_tokens": 1947742502912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2763304710388184, "created_at": "2025-06-03T05:24:33.143928+00:00"} {"global_step": 232190, "acc_step": 0, "speed/wps": 5520.679640166945, "speed/FLOPS": 243985782695385.25, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0487302765250206, "optim/lr": 2.416015011856598e-05, "optim/total_tokens": 1947750891520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2891595363616943, "created_at": "2025-06-03T05:24:36.116503+00:00"} {"global_step": 232191, "acc_step": 0, "speed/wps": 5510.034761986903, "speed/FLOPS": 243515333565253.12, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.06496826559305191, "optim/lr": 2.4156602893471434e-05, "optim/total_tokens": 1947759280128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2816065549850464, "created_at": "2025-06-03T05:24:39.094305+00:00"} {"global_step": 232192, "acc_step": 0, "speed/wps": 5515.1194269697025, "speed/FLOPS": 243740049731818.22, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.62 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.62, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046598758548498154, "optim/lr": 2.415305566837711e-05, "optim/total_tokens": 1947767668736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2849489450454712, "created_at": "2025-06-03T05:24:42.070111+00:00"} {"global_step": 232193, "acc_step": 0, "speed/wps": 5503.137643306423, "speed/FLOPS": 243210516222229.6, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.053878869861364365, "optim/lr": 2.4149508443282565e-05, "optim/total_tokens": 1947776057344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3039934635162354, "created_at": "2025-06-03T05:24:45.051660+00:00"} {"global_step": 232194, "acc_step": 0, "speed/wps": 5517.900074943642, "speed/FLOPS": 243862940139619.78, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0480705201625824, "optim/lr": 2.414596121818802e-05, "optim/total_tokens": 1947784445952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2976934909820557, "created_at": "2025-06-03T05:24:48.026064+00:00"} {"global_step": 232195, "acc_step": 0, "speed/wps": 5518.770793826815, "speed/FLOPS": 243901421457512.78, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04915527626872063, "optim/lr": 2.414241399309347e-05, "optim/total_tokens": 1947792834560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3010553121566772, "created_at": "2025-06-03T05:24:51.005926+00:00"} {"global_step": 232196, "acc_step": 0, "speed/wps": 5493.977769365916, "speed/FLOPS": 242805696678544.2, "speed/curr_iter_time": 2.9813, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9813, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.63 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.63, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.051520057022571564, "optim/lr": 2.4138866767999146e-05, "optim/total_tokens": 1947801223168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2977389097213745, "created_at": "2025-06-03T05:24:53.995643+00:00"} {"global_step": 232197, "acc_step": 0, "speed/wps": 5520.922007955297, "speed/FLOPS": 243996494111079.6, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.6 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.6, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04945847764611244, "optim/lr": 2.41353195429046e-05, "optim/total_tokens": 1947809611776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2905856370925903, "created_at": "2025-06-03T05:24:56.974295+00:00"} {"global_step": 232198, "acc_step": 0, "speed/wps": 5516.39198373519, "speed/FLOPS": 243796290227316.75, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04611153528094292, "optim/lr": 2.4131772317810053e-05, "optim/total_tokens": 1947818000384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.296613335609436, "created_at": "2025-06-03T05:24:59.951378+00:00"} {"global_step": 232199, "acc_step": 0, "speed/wps": 5520.430208493551, "speed/FLOPS": 243974759092128.25, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04331459850072861, "optim/lr": 2.4128225092715507e-05, "optim/total_tokens": 1947826388992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2921780347824097, "created_at": "2025-06-03T05:25:02.923742+00:00"} {"global_step": 232200, "acc_step": 0, "speed/wps": 5511.339609992756, "speed/FLOPS": 243573001168294.28, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.61 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.61, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046819351613521576, "optim/lr": 2.412467786762118e-05, "optim/total_tokens": 1947834777600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.304246187210083, "created_at": "2025-06-03T05:25:05.901536+00:00"} {"global_step": 232201, "acc_step": 0, "speed/wps": 247.23277355148326, "speed/FLOPS": 10926423138924.518, "speed/curr_iter_time": 2.8909, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.8909, "speed/est_time_elapsed": "7.77 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 186.46, "speed/est_time_elapsed_days": 7.77, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.047030188143253326, "optim/lr": 2.4121130642526634e-05, "optim/total_tokens": 1947843166208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.287305235862732, "created_at": "2025-06-03T05:26:12.178301+00:00"} {"global_step": 232202, "acc_step": 0, "speed/wps": 5600.547936259149, "speed/FLOPS": 247515552579662.34, "speed/curr_iter_time": 2.9242, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9242, "speed/est_time_elapsed": "7.86 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 188.61, "speed/est_time_elapsed_days": 7.86, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04273271933197975, "optim/lr": 2.4117583417432088e-05, "optim/total_tokens": 1947851554816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3049395084381104, "created_at": "2025-06-03T05:26:15.112693+00:00"} {"global_step": 232203, "acc_step": 0, "speed/wps": 5568.2237839445925, "speed/FLOPS": 246086990497368.94, "speed/curr_iter_time": 2.9404, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9404, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 189.66, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05060969293117523, "optim/lr": 2.411403619233754e-05, "optim/total_tokens": 1947859943424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.3009542226791382, "created_at": "2025-06-03T05:26:18.061315+00:00"} {"global_step": 232204, "acc_step": 0, "speed/wps": 5547.443717200302, "speed/FLOPS": 245168617909294.8, "speed/curr_iter_time": 2.9524, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9524, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 190.43, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04304242134094238, "optim/lr": 2.4110488967243215e-05, "optim/total_tokens": 1947868332032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2900456190109253, "created_at": "2025-06-03T05:26:21.022636+00:00"} {"global_step": 232205, "acc_step": 0, "speed/wps": 5530.621665999041, "speed/FLOPS": 244425169349262.6, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.02, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04898003861308098, "optim/lr": 2.410694174214867e-05, "optim/total_tokens": 1947876720640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.28489351272583, "created_at": "2025-06-03T05:26:23.990474+00:00"} {"global_step": 232206, "acc_step": 0, "speed/wps": 5572.771184490759, "speed/FLOPS": 246287962325803.5, "speed/curr_iter_time": 2.9383, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9383, "speed/est_time_elapsed": "7.9 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 189.53, "speed/est_time_elapsed_days": 7.9, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042986221611499786, "optim/lr": 2.4103394517054123e-05, "optim/total_tokens": 1947885109248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2922216653823853, "created_at": "2025-06-03T05:26:26.938405+00:00"} {"global_step": 232207, "acc_step": 0, "speed/wps": 5555.443307852126, "speed/FLOPS": 245522158870488.7, "speed/curr_iter_time": 2.9483, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9483, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04873787239193916, "optim/lr": 2.4099847291959576e-05, "optim/total_tokens": 1947893497856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.287136435508728, "created_at": "2025-06-03T05:26:29.896762+00:00"} {"global_step": 232208, "acc_step": 0, "speed/wps": 5545.818131180915, "speed/FLOPS": 245096775327741.44, "speed/curr_iter_time": 2.9534, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9534, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 190.5, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04286568611860275, "optim/lr": 2.409630006686525e-05, "optim/total_tokens": 1947901886464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2974573373794556, "created_at": "2025-06-03T05:26:32.860097+00:00"} {"global_step": 232209, "acc_step": 0, "speed/wps": 5545.55044500715, "speed/FLOPS": 245084944969003.1, "speed/curr_iter_time": 2.9528, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9528, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 190.46, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04788761958479881, "optim/lr": 2.4092752841770704e-05, "optim/total_tokens": 1947910275072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.294301986694336, "created_at": "2025-06-03T05:26:35.825469+00:00"} {"global_step": 232210, "acc_step": 0, "speed/wps": 5542.05777746557, "speed/FLOPS": 244930586940758.34, "speed/curr_iter_time": 2.9555, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9555, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 190.64, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04385741800069809, "optim/lr": 2.4089205616676157e-05, "optim/total_tokens": 1947918663680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2890108823776245, "created_at": "2025-06-03T05:26:38.788514+00:00"} {"global_step": 232211, "acc_step": 0, "speed/wps": 5532.454169626162, "speed/FLOPS": 244506156629977.5, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 190.97, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05104038864374161, "optim/lr": 2.408565839158183e-05, "optim/total_tokens": 1947927052288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2940738201141357, "created_at": "2025-06-03T05:26:41.754913+00:00"} {"global_step": 232212, "acc_step": 0, "speed/wps": 5528.138995311737, "speed/FLOPS": 244315448012344.28, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.12, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042751941829919815, "optim/lr": 2.4082111166487285e-05, "optim/total_tokens": 1947935440896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3067909479141235, "created_at": "2025-06-03T05:26:44.723368+00:00"} {"global_step": 232213, "acc_step": 0, "speed/wps": 5519.536538816949, "speed/FLOPS": 243935263466638.53, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044687509536743164, "optim/lr": 2.407856394139274e-05, "optim/total_tokens": 1947943829504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2867246866226196, "created_at": "2025-06-03T05:26:47.700427+00:00"} {"global_step": 232214, "acc_step": 0, "speed/wps": 5522.596077252132, "speed/FLOPS": 244070479405336.28, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04268372803926468, "optim/lr": 2.4075016716298192e-05, "optim/total_tokens": 1947952218112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.290795087814331, "created_at": "2025-06-03T05:26:50.671929+00:00"} {"global_step": 232215, "acc_step": 0, "speed/wps": 5525.6077721164565, "speed/FLOPS": 244203580903087.7, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044406913220882416, "optim/lr": 2.407146949120387e-05, "optim/total_tokens": 1947960606720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3046475648880005, "created_at": "2025-06-03T05:26:53.647652+00:00"} {"global_step": 232216, "acc_step": 0, "speed/wps": 5532.821628970192, "speed/FLOPS": 244522396452156.2, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.041487209498882294, "optim/lr": 2.406792226610932e-05, "optim/total_tokens": 1947968995328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.3067375421524048, "created_at": "2025-06-03T05:26:56.614506+00:00"} {"global_step": 232217, "acc_step": 0, "speed/wps": 5528.147410962803, "speed/FLOPS": 244315819941046.22, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04370046406984329, "optim/lr": 2.4064375041014773e-05, "optim/total_tokens": 1947977383936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3012676239013672, "created_at": "2025-06-03T05:26:59.584588+00:00"} {"global_step": 232218, "acc_step": 0, "speed/wps": 5532.068431223491, "speed/FLOPS": 244489108966967.53, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042273469269275665, "optim/lr": 2.4060827815920227e-05, "optim/total_tokens": 1947985772544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.293368935585022, "created_at": "2025-06-03T05:27:02.554662+00:00"} {"global_step": 232219, "acc_step": 0, "speed/wps": 5523.148376558658, "speed/FLOPS": 244094888207760.62, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04402747377753258, "optim/lr": 2.4057280590825904e-05, "optim/total_tokens": 1947994161152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2813326120376587, "created_at": "2025-06-03T05:27:05.528485+00:00"} {"global_step": 232220, "acc_step": 0, "speed/wps": 5516.524021300587, "speed/FLOPS": 243802125611877.78, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046806950122117996, "optim/lr": 2.4053733365731357e-05, "optim/total_tokens": 1948002549760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2940558195114136, "created_at": "2025-06-03T05:27:08.507845+00:00"} {"global_step": 232221, "acc_step": 0, "speed/wps": 5507.8694470900355, "speed/FLOPS": 243419637729897.94, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.6 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.6, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04179045557975769, "optim/lr": 2.405018614063681e-05, "optim/total_tokens": 1948010938368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2906503677368164, "created_at": "2025-06-03T05:27:11.492044+00:00"} {"global_step": 232222, "acc_step": 0, "speed/wps": 5518.02274187932, "speed/FLOPS": 243868361390310.47, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042403556406497955, "optim/lr": 2.404663891554226e-05, "optim/total_tokens": 1948019326976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3108835220336914, "created_at": "2025-06-03T05:27:14.469851+00:00"} {"global_step": 232223, "acc_step": 0, "speed/wps": 5518.216234053694, "speed/FLOPS": 243876912754035.06, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.59 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.59, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042111944407224655, "optim/lr": 2.404309169044794e-05, "optim/total_tokens": 1948027715584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2926524877548218, "created_at": "2025-06-03T05:27:17.446180+00:00"} {"global_step": 232224, "acc_step": 0, "speed/wps": 5538.496072359331, "speed/FLOPS": 244773177805521.94, "speed/curr_iter_time": 2.9575, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9575, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04219071939587593, "optim/lr": 2.4039544465353392e-05, "optim/total_tokens": 1948036104192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.29243803024292, "created_at": "2025-06-03T05:27:20.415351+00:00"} {"global_step": 232225, "acc_step": 0, "speed/wps": 5529.24286945388, "speed/FLOPS": 244364233599286.94, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04257012903690338, "optim/lr": 2.4035997240258846e-05, "optim/total_tokens": 1948044492800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2958123683929443, "created_at": "2025-06-03T05:27:23.383763+00:00"} {"global_step": 232226, "acc_step": 0, "speed/wps": 5520.79919172708, "speed/FLOPS": 243991066262422.84, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04267195239663124, "optim/lr": 2.40324500151643e-05, "optim/total_tokens": 1948052881408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3000930547714233, "created_at": "2025-06-03T05:27:26.359485+00:00"} {"global_step": 232227, "acc_step": 0, "speed/wps": 5522.171546365352, "speed/FLOPS": 244051717313086.66, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042123280465602875, "optim/lr": 2.4028902790069973e-05, "optim/total_tokens": 1948061270016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2747697830200195, "created_at": "2025-06-03T05:27:29.333873+00:00"} {"global_step": 232228, "acc_step": 0, "speed/wps": 5520.843709352499, "speed/FLOPS": 243993033713604.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043222103267908096, "optim/lr": 2.4025355564975427e-05, "optim/total_tokens": 1948069658624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2928836345672607, "created_at": "2025-06-03T05:27:32.307098+00:00"} {"global_step": 232229, "acc_step": 0, "speed/wps": 5504.294572803086, "speed/FLOPS": 243261646584280.12, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.6 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.6, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04506262391805649, "optim/lr": 2.402180833988088e-05, "optim/total_tokens": 1948078047232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2909374237060547, "created_at": "2025-06-03T05:27:35.289043+00:00"} {"global_step": 232230, "acc_step": 0, "speed/wps": 5515.474016501607, "speed/FLOPS": 243755720774174.66, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042849354445934296, "optim/lr": 2.4018261114786334e-05, "optim/total_tokens": 1948086435840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2865217924118042, "created_at": "2025-06-03T05:27:38.265336+00:00"} {"global_step": 232231, "acc_step": 0, "speed/wps": 5522.544180290507, "speed/FLOPS": 244068185825265.2, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05189979076385498, "optim/lr": 2.4014713889692008e-05, "optim/total_tokens": 1948094824448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3026039600372314, "created_at": "2025-06-03T05:27:41.242096+00:00"} {"global_step": 232232, "acc_step": 0, "speed/wps": 5521.86641812345, "speed/FLOPS": 244038232206582.5, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04208327829837799, "optim/lr": 2.401116666459746e-05, "optim/total_tokens": 1948103213056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2925819158554077, "created_at": "2025-06-03T05:27:44.218475+00:00"} {"global_step": 232233, "acc_step": 0, "speed/wps": 5518.079069645347, "speed/FLOPS": 243870850789257.2, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04250723123550415, "optim/lr": 2.4007619439502915e-05, "optim/total_tokens": 1948111601664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3065129518508911, "created_at": "2025-06-03T05:27:47.192019+00:00"} {"global_step": 232234, "acc_step": 0, "speed/wps": 5526.559494254044, "speed/FLOPS": 244245642150213.53, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04310545325279236, "optim/lr": 2.400407221440837e-05, "optim/total_tokens": 1948119990272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2953603267669678, "created_at": "2025-06-03T05:27:50.166089+00:00"} {"global_step": 232235, "acc_step": 0, "speed/wps": 5519.03388329396, "speed/FLOPS": 243913048665346.6, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042318254709243774, "optim/lr": 2.4000524989314042e-05, "optim/total_tokens": 1948128378880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2739726305007935, "created_at": "2025-06-03T05:27:53.140966+00:00"} {"global_step": 232236, "acc_step": 0, "speed/wps": 5520.334248322013, "speed/FLOPS": 243970518143714.97, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04414112865924835, "optim/lr": 2.3996977764219496e-05, "optim/total_tokens": 1948136767488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.3020273447036743, "created_at": "2025-06-03T05:27:56.113168+00:00"} {"global_step": 232237, "acc_step": 0, "speed/wps": 5514.827723231585, "speed/FLOPS": 243727157919668.5, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04813997820019722, "optim/lr": 2.399343053912495e-05, "optim/total_tokens": 1948145156096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2907308340072632, "created_at": "2025-06-03T05:27:59.088657+00:00"} {"global_step": 232238, "acc_step": 0, "speed/wps": 5517.61271441416, "speed/FLOPS": 243850240275061.22, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042617492377758026, "optim/lr": 2.3989883314030624e-05, "optim/total_tokens": 1948153544704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2918237447738647, "created_at": "2025-06-03T05:28:02.062732+00:00"} {"global_step": 232239, "acc_step": 0, "speed/wps": 5508.273460703202, "speed/FLOPS": 243437493063670.75, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04605129361152649, "optim/lr": 2.3986336088936077e-05, "optim/total_tokens": 1948161933312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2887592315673828, "created_at": "2025-06-03T05:28:05.044842+00:00"} {"global_step": 232240, "acc_step": 0, "speed/wps": 5517.620500142106, "speed/FLOPS": 243850584364385.44, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0432269386947155, "optim/lr": 2.398278886384153e-05, "optim/total_tokens": 1948170321920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2829570770263672, "created_at": "2025-06-03T05:28:08.023066+00:00"} {"global_step": 232241, "acc_step": 0, "speed/wps": 5515.773809518002, "speed/FLOPS": 243768970091019.53, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0500490702688694, "optim/lr": 2.3979241638746984e-05, "optim/total_tokens": 1948178710528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2854564189910889, "created_at": "2025-06-03T05:28:11.001608+00:00"} {"global_step": 232242, "acc_step": 0, "speed/wps": 5515.068563865437, "speed/FLOPS": 243737801842950.62, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04227384179830551, "optim/lr": 2.397569441365266e-05, "optim/total_tokens": 1948187099136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3036757707595825, "created_at": "2025-06-03T05:28:13.978500+00:00"} {"global_step": 232243, "acc_step": 0, "speed/wps": 5514.109082785378, "speed/FLOPS": 243695397690281.38, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.047881193459033966, "optim/lr": 2.3972147188558112e-05, "optim/total_tokens": 1948195487744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2785714864730835, "created_at": "2025-06-03T05:28:16.958779+00:00"} {"global_step": 232244, "acc_step": 0, "speed/wps": 5520.8283185321025, "speed/FLOPS": 243992353518120.34, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04252035170793533, "optim/lr": 2.3968599963463565e-05, "optim/total_tokens": 1948203876352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.293968915939331, "created_at": "2025-06-03T05:28:19.933185+00:00"} {"global_step": 232245, "acc_step": 0, "speed/wps": 5525.991176699977, "speed/FLOPS": 244220525423236.72, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05096575617790222, "optim/lr": 2.396505273836902e-05, "optim/total_tokens": 1948212264960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2952256202697754, "created_at": "2025-06-03T05:28:22.903220+00:00"} {"global_step": 232246, "acc_step": 0, "speed/wps": 5503.091381613307, "speed/FLOPS": 243208471692182.7, "speed/curr_iter_time": 2.9757, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9757, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0453941784799099, "optim/lr": 2.3961505513274696e-05, "optim/total_tokens": 1948220653568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.292850375175476, "created_at": "2025-06-03T05:28:25.888495+00:00"} {"global_step": 232247, "acc_step": 0, "speed/wps": 5509.128295639931, "speed/FLOPS": 243475272392432.34, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.055471330881118774, "optim/lr": 2.395795828818015e-05, "optim/total_tokens": 1948229042176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.296932578086853, "created_at": "2025-06-03T05:28:28.867602+00:00"} {"global_step": 232248, "acc_step": 0, "speed/wps": 5505.970540928521, "speed/FLOPS": 243335715797041.8, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044223904609680176, "optim/lr": 2.39544110630856e-05, "optim/total_tokens": 1948237430784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2922579050064087, "created_at": "2025-06-03T05:28:31.851880+00:00"} {"global_step": 232249, "acc_step": 0, "speed/wps": 5523.188381511643, "speed/FLOPS": 244096656221918.62, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04999575391411781, "optim/lr": 2.3950863837991054e-05, "optim/total_tokens": 1948245819392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3002732992172241, "created_at": "2025-06-03T05:28:34.822989+00:00"} {"global_step": 232250, "acc_step": 0, "speed/wps": 5504.167104555848, "speed/FLOPS": 243256013140193.8, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04579468071460724, "optim/lr": 2.394731661289673e-05, "optim/total_tokens": 1948254208000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2913944721221924, "created_at": "2025-06-03T05:28:37.804463+00:00"} {"global_step": 232251, "acc_step": 0, "speed/wps": 5510.6586418765, "speed/FLOPS": 243542905863066.56, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.048552751541137695, "optim/lr": 2.3943769387802184e-05, "optim/total_tokens": 1948262596608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2767168283462524, "created_at": "2025-06-03T05:28:40.782265+00:00"} {"global_step": 232252, "acc_step": 0, "speed/wps": 5504.618543674461, "speed/FLOPS": 243275964438561.62, "speed/curr_iter_time": 2.9757, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9757, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045267704874277115, "optim/lr": 2.3940222162707638e-05, "optim/total_tokens": 1948270985216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2867393493652344, "created_at": "2025-06-03T05:28:43.763290+00:00"} {"global_step": 232253, "acc_step": 0, "speed/wps": 5513.294383134538, "speed/FLOPS": 243659392135725.12, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04353363439440727, "optim/lr": 2.3936674937613088e-05, "optim/total_tokens": 1948279373824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2882959842681885, "created_at": "2025-06-03T05:28:46.743493+00:00"} {"global_step": 232254, "acc_step": 0, "speed/wps": 5498.978843884305, "speed/FLOPS": 243026718574437.1, "speed/curr_iter_time": 2.9787, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9787, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.048223648220300674, "optim/lr": 2.3933127712518766e-05, "optim/total_tokens": 1948287762432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2850679159164429, "created_at": "2025-06-03T05:28:49.727650+00:00"} {"global_step": 232255, "acc_step": 0, "speed/wps": 5513.304919067538, "speed/FLOPS": 243659857770035.94, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042373549193143845, "optim/lr": 2.392958048742422e-05, "optim/total_tokens": 1948296151040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3000845909118652, "created_at": "2025-06-03T05:28:52.704226+00:00"} {"global_step": 232256, "acc_step": 0, "speed/wps": 5511.30593523826, "speed/FLOPS": 243571512916508.56, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.048781875520944595, "optim/lr": 2.3926033262329673e-05, "optim/total_tokens": 1948304539648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2953009605407715, "created_at": "2025-06-03T05:28:55.681559+00:00"} {"global_step": 232257, "acc_step": 0, "speed/wps": 5513.126473244053, "speed/FLOPS": 243651971378006.4, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04297623410820961, "optim/lr": 2.3922486037235126e-05, "optim/total_tokens": 1948312928256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2929039001464844, "created_at": "2025-06-03T05:28:58.660514+00:00"} {"global_step": 232258, "acc_step": 0, "speed/wps": 5518.4885769906905, "speed/FLOPS": 243888948917872.78, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04819915443658829, "optim/lr": 2.39189388121408e-05, "optim/total_tokens": 1948321316864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3069987297058105, "created_at": "2025-06-03T05:29:01.634655+00:00"} {"global_step": 232259, "acc_step": 0, "speed/wps": 5519.250798696825, "speed/FLOPS": 243922635215879.56, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042420972138643265, "optim/lr": 2.3915391587046254e-05, "optim/total_tokens": 1948329705472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2790164947509766, "created_at": "2025-06-03T05:29:04.610277+00:00"} {"global_step": 232260, "acc_step": 0, "speed/wps": 5525.464606658513, "speed/FLOPS": 244197253722633.8, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045007407665252686, "optim/lr": 2.3911844361951707e-05, "optim/total_tokens": 1948338094080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.301392674446106, "created_at": "2025-06-03T05:29:07.579730+00:00"} {"global_step": 232261, "acc_step": 0, "speed/wps": 5520.533726019422, "speed/FLOPS": 243979334036921.03, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042287372052669525, "optim/lr": 2.390829713685716e-05, "optim/total_tokens": 1948346482688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2888563871383667, "created_at": "2025-06-03T05:29:10.556498+00:00"} {"global_step": 232262, "acc_step": 0, "speed/wps": 5516.063908426155, "speed/FLOPS": 243781790977899.06, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0431140698492527, "optim/lr": 2.3904749911762835e-05, "optim/total_tokens": 1948354871296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2972995042800903, "created_at": "2025-06-03T05:29:13.533191+00:00"} {"global_step": 232263, "acc_step": 0, "speed/wps": 5493.1533727382275, "speed/FLOPS": 242769262567244.8, "speed/curr_iter_time": 2.981, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.981, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.58 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.58, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043205395340919495, "optim/lr": 2.390120268666829e-05, "optim/total_tokens": 1948363259904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2909612655639648, "created_at": "2025-06-03T05:29:16.525233+00:00"} {"global_step": 232264, "acc_step": 0, "speed/wps": 5503.531488363099, "speed/FLOPS": 243227922157852.94, "speed/curr_iter_time": 2.9762, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9762, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04157346487045288, "optim/lr": 2.3897655461573742e-05, "optim/total_tokens": 1948371648512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2997498512268066, "created_at": "2025-06-03T05:29:19.508084+00:00"} {"global_step": 232265, "acc_step": 0, "speed/wps": 5502.610246986935, "speed/FLOPS": 243187208004367.28, "speed/curr_iter_time": 2.9767, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9767, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.57 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.57, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04381989315152168, "optim/lr": 2.3894108236479416e-05, "optim/total_tokens": 1948380037120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.302916169166565, "created_at": "2025-06-03T05:29:22.493537+00:00"} {"global_step": 232266, "acc_step": 0, "speed/wps": 5521.7210560607555, "speed/FLOPS": 244031807947441.9, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04274003952741623, "optim/lr": 2.389056101138487e-05, "optim/total_tokens": 1948388425728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2859389781951904, "created_at": "2025-06-03T05:29:25.467068+00:00"} {"global_step": 232267, "acc_step": 0, "speed/wps": 5507.197162774369, "speed/FLOPS": 243389926204208.53, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04466924071311951, "optim/lr": 2.3887013786290323e-05, "optim/total_tokens": 1948396814336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3004029989242554, "created_at": "2025-06-03T05:29:28.449974+00:00"} {"global_step": 232268, "acc_step": 0, "speed/wps": 5517.42011938954, "speed/FLOPS": 243841728560763.7, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04433603212237358, "optim/lr": 2.3883466561195777e-05, "optim/total_tokens": 1948405202944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2979038953781128, "created_at": "2025-06-03T05:29:31.426504+00:00"} {"global_step": 232269, "acc_step": 0, "speed/wps": 5515.645900272197, "speed/FLOPS": 243763317157053.8, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0427742600440979, "optim/lr": 2.387991933610145e-05, "optim/total_tokens": 1948413591552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.3014994859695435, "created_at": "2025-06-03T05:29:34.404208+00:00"} {"global_step": 232270, "acc_step": 0, "speed/wps": 5509.537342559638, "speed/FLOPS": 243493350172591.47, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04315904900431633, "optim/lr": 2.3876372111006904e-05, "optim/total_tokens": 1948421980160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2928285598754883, "created_at": "2025-06-03T05:29:37.384882+00:00"} {"global_step": 232271, "acc_step": 0, "speed/wps": 5521.7363821005165, "speed/FLOPS": 244032485279953.56, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.54 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.54, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04253644123673439, "optim/lr": 2.3872824885912358e-05, "optim/total_tokens": 1948430368768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.29338538646698, "created_at": "2025-06-03T05:29:40.360179+00:00"} {"global_step": 232272, "acc_step": 0, "speed/wps": 5503.083241333153, "speed/FLOPS": 243208111933465.6, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04355620592832565, "optim/lr": 2.386927766081781e-05, "optim/total_tokens": 1948438757376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2968116998672485, "created_at": "2025-06-03T05:29:43.344858+00:00"} {"global_step": 232273, "acc_step": 0, "speed/wps": 5515.601689510068, "speed/FLOPS": 243761363267658.94, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042543135583400726, "optim/lr": 2.386573043572349e-05, "optim/total_tokens": 1948447145984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2890164852142334, "created_at": "2025-06-03T05:29:46.319757+00:00"} {"global_step": 232274, "acc_step": 0, "speed/wps": 5516.385867678578, "speed/FLOPS": 243796019928919.3, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04310212656855583, "optim/lr": 2.3862183210628942e-05, "optim/total_tokens": 1948455534592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2896348237991333, "created_at": "2025-06-03T05:29:49.298697+00:00"} {"global_step": 232275, "acc_step": 0, "speed/wps": 5511.790658882848, "speed/FLOPS": 243592935220558.88, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04180379584431648, "optim/lr": 2.3858635985534392e-05, "optim/total_tokens": 1948463923200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2978551387786865, "created_at": "2025-06-03T05:29:52.275434+00:00"} {"global_step": 232276, "acc_step": 0, "speed/wps": 5506.978416170341, "speed/FLOPS": 243380258723957.12, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 191.91, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04261484742164612, "optim/lr": 2.3855088760439846e-05, "optim/total_tokens": 1948472311808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3019849061965942, "created_at": "2025-06-03T05:29:55.255811+00:00"} {"global_step": 232277, "acc_step": 0, "speed/wps": 5518.317222679731, "speed/FLOPS": 243881375934399.22, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.54 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.54, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04311171919107437, "optim/lr": 2.3851541535345523e-05, "optim/total_tokens": 1948480700416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2901976108551025, "created_at": "2025-06-03T05:29:58.232388+00:00"} {"global_step": 232278, "acc_step": 0, "speed/wps": 5510.225097714932, "speed/FLOPS": 243523745430205.47, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042674049735069275, "optim/lr": 2.3847994310250977e-05, "optim/total_tokens": 1948489089024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.277819275856018, "created_at": "2025-06-03T05:30:01.210101+00:00"} {"global_step": 232279, "acc_step": 0, "speed/wps": 5509.912311019331, "speed/FLOPS": 243509921859247.34, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04213452711701393, "optim/lr": 2.384444708515643e-05, "optim/total_tokens": 1948497477632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2910685539245605, "created_at": "2025-06-03T05:30:04.191969+00:00"} {"global_step": 232280, "acc_step": 0, "speed/wps": 5499.359036324771, "speed/FLOPS": 243043521134304.38, "speed/curr_iter_time": 2.9774, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9774, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.56 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.56, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04148219898343086, "optim/lr": 2.384089986006188e-05, "optim/total_tokens": 1948505866240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2748950719833374, "created_at": "2025-06-03T05:30:07.176817+00:00"} {"global_step": 232281, "acc_step": 0, "speed/wps": 5505.885052319065, "speed/FLOPS": 243331937638074.25, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043914493173360825, "optim/lr": 2.3837352634967558e-05, "optim/total_tokens": 1948514254848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3001320362091064, "created_at": "2025-06-03T05:30:10.157420+00:00"} {"global_step": 232282, "acc_step": 0, "speed/wps": 5502.654190775353, "speed/FLOPS": 243189150094890.66, "speed/curr_iter_time": 2.9767, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9767, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04680575057864189, "optim/lr": 2.383380540987301e-05, "optim/total_tokens": 1948522643456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3091809749603271, "created_at": "2025-06-03T05:30:13.143645+00:00"} {"global_step": 232283, "acc_step": 0, "speed/wps": 5516.244335114405, "speed/FLOPS": 243789764914012.2, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.54 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.54, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043337102979421616, "optim/lr": 2.3830258184778465e-05, "optim/total_tokens": 1948531032064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2965916395187378, "created_at": "2025-06-03T05:30:16.118347+00:00"} {"global_step": 232284, "acc_step": 0, "speed/wps": 5521.235082485943, "speed/FLOPS": 244010330402873.44, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04348598048090935, "optim/lr": 2.382671095968392e-05, "optim/total_tokens": 1948539420672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2824318408966064, "created_at": "2025-06-03T05:30:19.092811+00:00"} {"global_step": 232285, "acc_step": 0, "speed/wps": 5519.974556749627, "speed/FLOPS": 243954621617283.84, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04360440373420715, "optim/lr": 2.3823163734589593e-05, "optim/total_tokens": 1948547809280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.292227864265442, "created_at": "2025-06-03T05:30:22.069408+00:00"} {"global_step": 232286, "acc_step": 0, "speed/wps": 5529.35789385326, "speed/FLOPS": 244369317088991.28, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04251076281070709, "optim/lr": 2.3819616509495046e-05, "optim/total_tokens": 1948556197888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2975090742111206, "created_at": "2025-06-03T05:30:25.038297+00:00"} {"global_step": 232287, "acc_step": 0, "speed/wps": 5528.879934386347, "speed/FLOPS": 244348193726972.03, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04236118122935295, "optim/lr": 2.38160692844005e-05, "optim/total_tokens": 1948564586496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2819633483886719, "created_at": "2025-06-03T05:30:28.008512+00:00"} {"global_step": 232288, "acc_step": 0, "speed/wps": 5516.947814022081, "speed/FLOPS": 243820855081000.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.54 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.54, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04588078334927559, "optim/lr": 2.3812522059305953e-05, "optim/total_tokens": 1948572975104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3023184537887573, "created_at": "2025-06-03T05:30:30.983009+00:00"} {"global_step": 232289, "acc_step": 0, "speed/wps": 5525.189773079343, "speed/FLOPS": 244185107485160.28, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04701554775238037, "optim/lr": 2.3808974834211627e-05, "optim/total_tokens": 1948581363712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2679003477096558, "created_at": "2025-06-03T05:30:33.953747+00:00"} {"global_step": 232290, "acc_step": 0, "speed/wps": 5525.919441645129, "speed/FLOPS": 244217355100985.75, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042802147567272186, "optim/lr": 2.380542760911708e-05, "optim/total_tokens": 1948589752320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.292587399482727, "created_at": "2025-06-03T05:30:36.925024+00:00"} {"global_step": 232291, "acc_step": 0, "speed/wps": 5516.925835443377, "speed/FLOPS": 243819883740317.88, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045747168362140656, "optim/lr": 2.3801880384022534e-05, "optim/total_tokens": 1948598140928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2857613563537598, "created_at": "2025-06-03T05:30:39.902613+00:00"} {"global_step": 232292, "acc_step": 0, "speed/wps": 5512.339994495812, "speed/FLOPS": 243617213042897.3, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.54 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.54, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046587347984313965, "optim/lr": 2.3798333158928208e-05, "optim/total_tokens": 1948606529536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2832874059677124, "created_at": "2025-06-03T05:30:42.880009+00:00"} {"global_step": 232293, "acc_step": 0, "speed/wps": 5508.794306983828, "speed/FLOPS": 243460511803341.5, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.54 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.54, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04312584176659584, "optim/lr": 2.3794785933833662e-05, "optim/total_tokens": 1948614918144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2957632541656494, "created_at": "2025-06-03T05:30:45.858386+00:00"} {"global_step": 232294, "acc_step": 0, "speed/wps": 5512.891532154261, "speed/FLOPS": 243641588184375.1, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044914934784173965, "optim/lr": 2.3791238708739115e-05, "optim/total_tokens": 1948623306752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2894537448883057, "created_at": "2025-06-03T05:30:48.838827+00:00"} {"global_step": 232295, "acc_step": 0, "speed/wps": 5513.493601633425, "speed/FLOPS": 243668196573683.2, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04399897903203964, "optim/lr": 2.378769148364457e-05, "optim/total_tokens": 1948631695360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.295220971107483, "created_at": "2025-06-03T05:30:51.818066+00:00"} {"global_step": 232296, "acc_step": 0, "speed/wps": 5506.5176306723215, "speed/FLOPS": 243359894363458.66, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.54 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.54, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044722650200128555, "optim/lr": 2.3784144258550243e-05, "optim/total_tokens": 1948640083968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2694275379180908, "created_at": "2025-06-03T05:30:54.800674+00:00"} {"global_step": 232297, "acc_step": 0, "speed/wps": 5498.196303786316, "speed/FLOPS": 242992134307509.3, "speed/curr_iter_time": 2.9782, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9782, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.55 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.55, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043476540595293045, "optim/lr": 2.3780597033455696e-05, "optim/total_tokens": 1948648472576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2967125177383423, "created_at": "2025-06-03T05:30:57.785416+00:00"} {"global_step": 232298, "acc_step": 0, "speed/wps": 5521.1220128688365, "speed/FLOPS": 244005333304540.1, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044618699699640274, "optim/lr": 2.377704980836115e-05, "optim/total_tokens": 1948656861184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.276922345161438, "created_at": "2025-06-03T05:31:00.757180+00:00"} {"global_step": 232299, "acc_step": 0, "speed/wps": 5530.579552064296, "speed/FLOPS": 244423308128905.5, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.049025487154722214, "optim/lr": 2.3773502583266604e-05, "optim/total_tokens": 1948665249792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2832425832748413, "created_at": "2025-06-03T05:31:03.724118+00:00"} {"global_step": 232300, "acc_step": 0, "speed/wps": 5523.986895496428, "speed/FLOPS": 244131946452881.03, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0428340844810009, "optim/lr": 2.376995535817228e-05, "optim/total_tokens": 1948673638400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.284829020500183, "created_at": "2025-06-03T05:31:06.694747+00:00"} {"global_step": 232301, "acc_step": 0, "speed/wps": 5518.440915642052, "speed/FLOPS": 243886842530215.84, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04525183141231537, "optim/lr": 2.376640813307773e-05, "optim/total_tokens": 1948682027008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2919921875, "created_at": "2025-06-03T05:31:09.667980+00:00"} {"global_step": 232302, "acc_step": 0, "speed/wps": 5515.177772890111, "speed/FLOPS": 243742628322858.75, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043951235711574554, "optim/lr": 2.3762860907983185e-05, "optim/total_tokens": 1948690415616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2969824075698853, "created_at": "2025-06-03T05:31:12.644760+00:00"} {"global_step": 232303, "acc_step": 0, "speed/wps": 5523.437159415604, "speed/FLOPS": 244107650931912.94, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05236166715621948, "optim/lr": 2.375931368288864e-05, "optim/total_tokens": 1948698804224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2848366498947144, "created_at": "2025-06-03T05:31:15.616044+00:00"} {"global_step": 232304, "acc_step": 0, "speed/wps": 5523.103470191547, "speed/FLOPS": 244092903576185.9, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043435245752334595, "optim/lr": 2.3755766457794316e-05, "optim/total_tokens": 1948707192832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2982021570205688, "created_at": "2025-06-03T05:31:18.587429+00:00"} {"global_step": 232305, "acc_step": 0, "speed/wps": 5510.437799662937, "speed/FLOPS": 243533145767600.03, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.056225527077913284, "optim/lr": 2.375221923269977e-05, "optim/total_tokens": 1948715581440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3081475496292114, "created_at": "2025-06-03T05:31:21.564966+00:00"} {"global_step": 232306, "acc_step": 0, "speed/wps": 5504.590835524836, "speed/FLOPS": 243274739880171.38, "speed/curr_iter_time": 2.9756, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9756, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043045997619628906, "optim/lr": 2.374867200760522e-05, "optim/total_tokens": 1948723970048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2788983583450317, "created_at": "2025-06-03T05:31:24.545381+00:00"} {"global_step": 232307, "acc_step": 0, "speed/wps": 5500.913751707438, "speed/FLOPS": 243112231596463.53, "speed/curr_iter_time": 2.9768, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9768, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.53 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.53, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04501684755086899, "optim/lr": 2.3745124782510673e-05, "optim/total_tokens": 1948732358656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2893184423446655, "created_at": "2025-06-03T05:31:27.528225+00:00"} {"global_step": 232308, "acc_step": 0, "speed/wps": 5536.964665795146, "speed/FLOPS": 244705497473834.3, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04325130581855774, "optim/lr": 2.374157755741635e-05, "optim/total_tokens": 1948740747264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2941796779632568, "created_at": "2025-06-03T05:31:30.492276+00:00"} {"global_step": 232309, "acc_step": 0, "speed/wps": 5522.750931811289, "speed/FLOPS": 244077323184233.53, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043102312833070755, "optim/lr": 2.3738030332321804e-05, "optim/total_tokens": 1948749135872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.279205322265625, "created_at": "2025-06-03T05:31:33.466420+00:00"} {"global_step": 232310, "acc_step": 0, "speed/wps": 5517.650355298452, "speed/FLOPS": 243851903809483.4, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04780413582921028, "optim/lr": 2.3734483107227257e-05, "optim/total_tokens": 1948757524480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2957077026367188, "created_at": "2025-06-03T05:31:36.441767+00:00"} {"global_step": 232311, "acc_step": 0, "speed/wps": 5519.359693754325, "speed/FLOPS": 243927447820045.66, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04380123317241669, "optim/lr": 2.3730935882132708e-05, "optim/total_tokens": 1948765913088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2870090007781982, "created_at": "2025-06-03T05:31:39.415492+00:00"} {"global_step": 232312, "acc_step": 0, "speed/wps": 5517.603730310185, "speed/FLOPS": 243849843223650.3, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04326377809047699, "optim/lr": 2.3727388657038385e-05, "optim/total_tokens": 1948774301696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2885252237319946, "created_at": "2025-06-03T05:31:42.388959+00:00"} {"global_step": 232313, "acc_step": 0, "speed/wps": 5508.742557831468, "speed/FLOPS": 243458224755683.34, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042255010455846786, "optim/lr": 2.372384143194384e-05, "optim/total_tokens": 1948782690304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3031145334243774, "created_at": "2025-06-03T05:31:45.367363+00:00"} {"global_step": 232314, "acc_step": 0, "speed/wps": 5510.713464315059, "speed/FLOPS": 243545328734244.22, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.52 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.52, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043037332594394684, "optim/lr": 2.3720294206849292e-05, "optim/total_tokens": 1948791078912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.300186276435852, "created_at": "2025-06-03T05:31:48.349019+00:00"} {"global_step": 232315, "acc_step": 0, "speed/wps": 5520.034463840169, "speed/FLOPS": 243957269204053.56, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04339952766895294, "optim/lr": 2.3716746981754746e-05, "optim/total_tokens": 1948799467520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2804614305496216, "created_at": "2025-06-03T05:31:51.321411+00:00"} {"global_step": 232316, "acc_step": 0, "speed/wps": 5522.575324851656, "speed/FLOPS": 244069562255455.66, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04257287457585335, "optim/lr": 2.371319975666042e-05, "optim/total_tokens": 1948807856128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2958600521087646, "created_at": "2025-06-03T05:31:54.295766+00:00"} {"global_step": 232317, "acc_step": 0, "speed/wps": 5524.881628734556, "speed/FLOPS": 244171489082346.44, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045768484473228455, "optim/lr": 2.3709652531565873e-05, "optim/total_tokens": 1948816244736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2952194213867188, "created_at": "2025-06-03T05:31:57.266723+00:00"} {"global_step": 232318, "acc_step": 0, "speed/wps": 5532.454552396743, "speed/FLOPS": 244506173546477.94, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04768626391887665, "optim/lr": 2.3706105306471327e-05, "optim/total_tokens": 1948824633344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2941185235977173, "created_at": "2025-06-03T05:32:00.232213+00:00"} {"global_step": 232319, "acc_step": 0, "speed/wps": 5529.449920815862, "speed/FLOPS": 244373384209701.62, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05504687875509262, "optim/lr": 2.3702558081377e-05, "optim/total_tokens": 1948833021952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2919249534606934, "created_at": "2025-06-03T05:32:03.199442+00:00"} {"global_step": 232320, "acc_step": 0, "speed/wps": 5516.704554209408, "speed/FLOPS": 243810104242396.5, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04255181923508644, "optim/lr": 2.3699010856282454e-05, "optim/total_tokens": 1948841410560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3021272420883179, "created_at": "2025-06-03T05:32:06.174711+00:00"} {"global_step": 232321, "acc_step": 0, "speed/wps": 5520.169465024348, "speed/FLOPS": 243963235565395.56, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04181886091828346, "optim/lr": 2.3695463631187908e-05, "optim/total_tokens": 1948849799168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.299971580505371, "created_at": "2025-06-03T05:32:09.146879+00:00"} {"global_step": 232322, "acc_step": 0, "speed/wps": 5522.283337633179, "speed/FLOPS": 244056657914925.03, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043011825531721115, "optim/lr": 2.369191640609336e-05, "optim/total_tokens": 1948858187776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2864121198654175, "created_at": "2025-06-03T05:32:12.118759+00:00"} {"global_step": 232323, "acc_step": 0, "speed/wps": 5511.294961917143, "speed/FLOPS": 243571027951881.78, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.51 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.51, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042739756405353546, "optim/lr": 2.3688369180999035e-05, "optim/total_tokens": 1948866576384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2826814651489258, "created_at": "2025-06-03T05:32:15.097616+00:00"} {"global_step": 232324, "acc_step": 0, "speed/wps": 5530.441901444697, "speed/FLOPS": 244417224676078.97, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04536055400967598, "optim/lr": 2.368482195590449e-05, "optim/total_tokens": 1948874964992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2857686281204224, "created_at": "2025-06-03T05:32:18.064709+00:00"} {"global_step": 232325, "acc_step": 0, "speed/wps": 5533.50392955159, "speed/FLOPS": 244552550645523.0, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05256269499659538, "optim/lr": 2.3681274730809942e-05, "optim/total_tokens": 1948883353600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2878109216690063, "created_at": "2025-06-03T05:32:21.030256+00:00"} {"global_step": 232326, "acc_step": 0, "speed/wps": 5531.32236817039, "speed/FLOPS": 244456136798717.38, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042128775268793106, "optim/lr": 2.3677727505715396e-05, "optim/total_tokens": 1948891742208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.303370714187622, "created_at": "2025-06-03T05:32:23.996372+00:00"} {"global_step": 232327, "acc_step": 0, "speed/wps": 5519.386107882987, "speed/FLOPS": 243928615189332.72, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04503508657217026, "optim/lr": 2.367418028062107e-05, "optim/total_tokens": 1948900130816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2850629091262817, "created_at": "2025-06-03T05:32:26.971366+00:00"} {"global_step": 232328, "acc_step": 0, "speed/wps": 5516.291728475681, "speed/FLOPS": 243791859457999.4, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04291670769453049, "optim/lr": 2.3670633055526523e-05, "optim/total_tokens": 1948908519424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2839560508728027, "created_at": "2025-06-03T05:32:29.950313+00:00"} {"global_step": 232329, "acc_step": 0, "speed/wps": 5518.522986580423, "speed/FLOPS": 243890469645614.72, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04457734897732735, "optim/lr": 2.3667085830431977e-05, "optim/total_tokens": 1948916908032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3014929294586182, "created_at": "2025-06-03T05:32:32.928081+00:00"} {"global_step": 232330, "acc_step": 0, "speed/wps": 5519.215235043093, "speed/FLOPS": 243921063484415.9, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04301303252577782, "optim/lr": 2.366353860533743e-05, "optim/total_tokens": 1948925296640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.278834342956543, "created_at": "2025-06-03T05:32:35.904918+00:00"} {"global_step": 232331, "acc_step": 0, "speed/wps": 5512.663676311597, "speed/FLOPS": 243631518122401.25, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04336429759860039, "optim/lr": 2.3659991380243108e-05, "optim/total_tokens": 1948933685248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.300449252128601, "created_at": "2025-06-03T05:32:38.881571+00:00"} {"global_step": 232332, "acc_step": 0, "speed/wps": 5521.728890649554, "speed/FLOPS": 244032154196165.75, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04264315962791443, "optim/lr": 2.365644415514856e-05, "optim/total_tokens": 1948942073856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3002146482467651, "created_at": "2025-06-03T05:32:41.854691+00:00"} {"global_step": 232333, "acc_step": 0, "speed/wps": 5532.343681197453, "speed/FLOPS": 244501273606959.6, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042935434728860855, "optim/lr": 2.3652896930054012e-05, "optim/total_tokens": 1948950462464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2815754413604736, "created_at": "2025-06-03T05:32:44.820259+00:00"} {"global_step": 232334, "acc_step": 0, "speed/wps": 5529.732772807792, "speed/FLOPS": 244385884819977.16, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04309042543172836, "optim/lr": 2.3649349704959465e-05, "optim/total_tokens": 1948958851072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.300672173500061, "created_at": "2025-06-03T05:32:47.790355+00:00"} {"global_step": 232335, "acc_step": 0, "speed/wps": 5533.130904177156, "speed/FLOPS": 244536064833289.97, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.05, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04520849511027336, "optim/lr": 2.3645802479865143e-05, "optim/total_tokens": 1948967239680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.276909589767456, "created_at": "2025-06-03T05:32:50.755680+00:00"} {"global_step": 232336, "acc_step": 0, "speed/wps": 5519.074429049212, "speed/FLOPS": 243914840580196.75, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04245296120643616, "optim/lr": 2.3642255254770596e-05, "optim/total_tokens": 1948975628288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2939358949661255, "created_at": "2025-06-03T05:32:53.728246+00:00"} {"global_step": 232337, "acc_step": 0, "speed/wps": 5535.77492851594, "speed/FLOPS": 244652917175720.8, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043637003749608994, "optim/lr": 2.363870802967605e-05, "optim/total_tokens": 1948984016896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.291981816291809, "created_at": "2025-06-03T05:32:56.696411+00:00"} {"global_step": 232338, "acc_step": 0, "speed/wps": 5513.248404934183, "speed/FLOPS": 243657360134607.16, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0421714261174202, "optim/lr": 2.36351608045815e-05, "optim/total_tokens": 1948992405504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2889808416366577, "created_at": "2025-06-03T05:32:59.673365+00:00"} {"global_step": 232339, "acc_step": 0, "speed/wps": 5515.436221579646, "speed/FLOPS": 243754050432075.9, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04479534178972244, "optim/lr": 2.3631613579487177e-05, "optim/total_tokens": 1949000794112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2998274564743042, "created_at": "2025-06-03T05:33:02.648207+00:00"} {"global_step": 232340, "acc_step": 0, "speed/wps": 5518.8354055948075, "speed/FLOPS": 243904276966945.03, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.041646040976047516, "optim/lr": 2.362806635439263e-05, "optim/total_tokens": 1949009182720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.282017469406128, "created_at": "2025-06-03T05:33:05.621302+00:00"} {"global_step": 232341, "acc_step": 0, "speed/wps": 5507.394513715187, "speed/FLOPS": 243398648105659.0, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.5 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.5, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043531130999326706, "optim/lr": 2.3624519129298084e-05, "optim/total_tokens": 1949017571328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2800114154815674, "created_at": "2025-06-03T05:33:08.604237+00:00"} {"global_step": 232342, "acc_step": 0, "speed/wps": 5529.376468796568, "speed/FLOPS": 244370138006410.3, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042618319392204285, "optim/lr": 2.3620971904203538e-05, "optim/total_tokens": 1949025959936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2904865741729736, "created_at": "2025-06-03T05:33:11.571286+00:00"} {"global_step": 232343, "acc_step": 0, "speed/wps": 5534.7674433830325, "speed/FLOPS": 244608391489622.72, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04363604262471199, "optim/lr": 2.3617424679109212e-05, "optim/total_tokens": 1949034348544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2745928764343262, "created_at": "2025-06-03T05:33:14.535434+00:00"} {"global_step": 232344, "acc_step": 0, "speed/wps": 5523.678827203463, "speed/FLOPS": 244118331411168.44, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043102387338876724, "optim/lr": 2.3613877454014665e-05, "optim/total_tokens": 1949042737152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3030657768249512, "created_at": "2025-06-03T05:33:17.510402+00:00"} {"global_step": 232345, "acc_step": 0, "speed/wps": 5523.07274232847, "speed/FLOPS": 244091545561917.38, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05272441357374191, "optim/lr": 2.361033022892012e-05, "optim/total_tokens": 1949051125760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2814531326293945, "created_at": "2025-06-03T05:33:20.481108+00:00"} {"global_step": 232346, "acc_step": 0, "speed/wps": 5511.1769650023125, "speed/FLOPS": 243565813092209.22, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042166754603385925, "optim/lr": 2.3606783003825793e-05, "optim/total_tokens": 1949059514368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3050274848937988, "created_at": "2025-06-03T05:33:23.459497+00:00"} {"global_step": 232347, "acc_step": 0, "speed/wps": 5513.480749521327, "speed/FLOPS": 243667628576111.53, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.49 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.49, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0591331385076046, "optim/lr": 2.3603235778731247e-05, "optim/total_tokens": 1949067902976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3113391399383545, "created_at": "2025-06-03T05:33:26.438626+00:00"} {"global_step": 232348, "acc_step": 0, "speed/wps": 5518.773357406659, "speed/FLOPS": 243901534754620.28, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04952654615044594, "optim/lr": 2.35996885536367e-05, "optim/total_tokens": 1949076291584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.295648217201233, "created_at": "2025-06-03T05:33:29.412898+00:00"} {"global_step": 232349, "acc_step": 0, "speed/wps": 5517.913679767047, "speed/FLOPS": 243863541403178.5, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05330535024404526, "optim/lr": 2.3596141328542154e-05, "optim/total_tokens": 1949084680192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2908354997634888, "created_at": "2025-06-03T05:33:32.388817+00:00"} {"global_step": 232350, "acc_step": 0, "speed/wps": 5524.025213586879, "speed/FLOPS": 244133639916349.2, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04671977832913399, "optim/lr": 2.3592594103447828e-05, "optim/total_tokens": 1949093068800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.303685188293457, "created_at": "2025-06-03T05:33:35.359140+00:00"} {"global_step": 232351, "acc_step": 0, "speed/wps": 5532.182811227277, "speed/FLOPS": 244494163977684.97, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045956287533044815, "optim/lr": 2.358904687835328e-05, "optim/total_tokens": 1949101457408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2832555770874023, "created_at": "2025-06-03T05:33:38.327004+00:00"} {"global_step": 232352, "acc_step": 0, "speed/wps": 5520.634662192804, "speed/FLOPS": 243983794899146.34, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04336254671216011, "optim/lr": 2.3585499653258735e-05, "optim/total_tokens": 1949109846016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2944728136062622, "created_at": "2025-06-03T05:33:41.303037+00:00"} {"global_step": 232353, "acc_step": 0, "speed/wps": 5524.2972476772, "speed/FLOPS": 244145662430744.72, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043554265052080154, "optim/lr": 2.358195242816419e-05, "optim/total_tokens": 1949118234624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2941993474960327, "created_at": "2025-06-03T05:33:44.275654+00:00"} {"global_step": 232354, "acc_step": 0, "speed/wps": 5519.1188314230185, "speed/FLOPS": 243916802937847.06, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04119259491562843, "optim/lr": 2.3578405203069862e-05, "optim/total_tokens": 1949126623232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2816096544265747, "created_at": "2025-06-03T05:33:47.252569+00:00"} {"global_step": 232355, "acc_step": 0, "speed/wps": 5537.672908176577, "speed/FLOPS": 244736798161980.44, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04240646958351135, "optim/lr": 2.3574857977975316e-05, "optim/total_tokens": 1949135011840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.288733959197998, "created_at": "2025-06-03T05:33:50.215161+00:00"} {"global_step": 232356, "acc_step": 0, "speed/wps": 5515.115289090814, "speed/FLOPS": 243739866858750.94, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04333009198307991, "optim/lr": 2.357131075288077e-05, "optim/total_tokens": 1949143400448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.289008378982544, "created_at": "2025-06-03T05:33:53.193969+00:00"} {"global_step": 232357, "acc_step": 0, "speed/wps": 5523.260945235089, "speed/FLOPS": 244099863167080.12, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045876313000917435, "optim/lr": 2.3567763527786223e-05, "optim/total_tokens": 1949151789056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2793391942977905, "created_at": "2025-06-03T05:33:56.167942+00:00"} {"global_step": 232358, "acc_step": 0, "speed/wps": 5527.639182079855, "speed/FLOPS": 244293358825771.16, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042878590524196625, "optim/lr": 2.35642163026919e-05, "optim/total_tokens": 1949160177664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2850561141967773, "created_at": "2025-06-03T05:33:59.139411+00:00"} {"global_step": 232359, "acc_step": 0, "speed/wps": 5527.181414848966, "speed/FLOPS": 244273127857230.9, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0452638603746891, "optim/lr": 2.356066907759735e-05, "optim/total_tokens": 1949168566272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.291808843612671, "created_at": "2025-06-03T05:34:02.111297+00:00"} {"global_step": 232360, "acc_step": 0, "speed/wps": 5530.776442370762, "speed/FLOPS": 244432009672675.38, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04247956722974777, "optim/lr": 2.3557121852502804e-05, "optim/total_tokens": 1949176954880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2962679862976074, "created_at": "2025-06-03T05:34:05.081433+00:00"} {"global_step": 232361, "acc_step": 0, "speed/wps": 5536.220157613747, "speed/FLOPS": 244672594022954.78, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 190.91, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04931947588920593, "optim/lr": 2.3553574627408258e-05, "optim/total_tokens": 1949185343488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2948607206344604, "created_at": "2025-06-03T05:34:08.049309+00:00"} {"global_step": 232362, "acc_step": 0, "speed/wps": 5525.789926724188, "speed/FLOPS": 244211631204397.62, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04364163801074028, "optim/lr": 2.3550027402313935e-05, "optim/total_tokens": 1949193732096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.3003318309783936, "created_at": "2025-06-03T05:34:11.019909+00:00"} {"global_step": 232363, "acc_step": 0, "speed/wps": 5523.39490163562, "speed/FLOPS": 244105783354332.6, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0460287481546402, "optim/lr": 2.354648017721939e-05, "optim/total_tokens": 1949202120704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2984530925750732, "created_at": "2025-06-03T05:34:13.990155+00:00"} {"global_step": 232364, "acc_step": 0, "speed/wps": 5527.7466519512045, "speed/FLOPS": 244298108444004.1, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04375767335295677, "optim/lr": 2.354293295212484e-05, "optim/total_tokens": 1949210509312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2909621000289917, "created_at": "2025-06-03T05:34:16.957946+00:00"} {"global_step": 232365, "acc_step": 0, "speed/wps": 5511.236429211472, "speed/FLOPS": 243568441105888.62, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.48 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.48, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04437451437115669, "optim/lr": 2.3539385727030292e-05, "optim/total_tokens": 1949218897920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2999153137207031, "created_at": "2025-06-03T05:34:19.937943+00:00"} {"global_step": 232366, "acc_step": 0, "speed/wps": 5521.378847215232, "speed/FLOPS": 244016684068053.4, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.47 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.47, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04268380627036095, "optim/lr": 2.353583850193597e-05, "optim/total_tokens": 1949227286528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.295092225074768, "created_at": "2025-06-03T05:34:22.910612+00:00"} {"global_step": 232367, "acc_step": 0, "speed/wps": 5525.457606204262, "speed/FLOPS": 244196944338387.53, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04891236871480942, "optim/lr": 2.3532291276841423e-05, "optim/total_tokens": 1949235675136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2903591394424438, "created_at": "2025-06-03T05:34:25.882566+00:00"} {"global_step": 232368, "acc_step": 0, "speed/wps": 5527.086313816588, "speed/FLOPS": 244268924878371.03, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04598385468125343, "optim/lr": 2.3528744051746877e-05, "optim/total_tokens": 1949244063744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2831692695617676, "created_at": "2025-06-03T05:34:28.851667+00:00"} {"global_step": 232369, "acc_step": 0, "speed/wps": 5524.05256787009, "speed/FLOPS": 244134848835655.22, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04485272988677025, "optim/lr": 2.3525196826652327e-05, "optim/total_tokens": 1949252452352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2914421558380127, "created_at": "2025-06-03T05:34:31.822230+00:00"} {"global_step": 232370, "acc_step": 0, "speed/wps": 5524.251473051536, "speed/FLOPS": 244143639426586.12, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04302981123328209, "optim/lr": 2.3521649601558004e-05, "optim/total_tokens": 1949260840960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.297704815864563, "created_at": "2025-06-03T05:34:34.796306+00:00"} {"global_step": 232371, "acc_step": 0, "speed/wps": 5523.74442981417, "speed/FLOPS": 244121230710777.1, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043243248015642166, "optim/lr": 2.3518102376463458e-05, "optim/total_tokens": 1949269229568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.300328016281128, "created_at": "2025-06-03T05:34:37.768509+00:00"} {"global_step": 232372, "acc_step": 0, "speed/wps": 5520.658541816168, "speed/FLOPS": 243984850256272.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04256262630224228, "optim/lr": 2.351455515136891e-05, "optim/total_tokens": 1949277618176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2901325225830078, "created_at": "2025-06-03T05:34:40.743081+00:00"} {"global_step": 232373, "acc_step": 0, "speed/wps": 5519.180177453589, "speed/FLOPS": 243919514118400.8, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046507060527801514, "optim/lr": 2.3511007926274365e-05, "optim/total_tokens": 1949286006784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2956229448318481, "created_at": "2025-06-03T05:34:43.718183+00:00"} {"global_step": 232374, "acc_step": 0, "speed/wps": 5527.125712052747, "speed/FLOPS": 244270666078750.8, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04442235082387924, "optim/lr": 2.350746070118004e-05, "optim/total_tokens": 1949294395392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.304030179977417, "created_at": "2025-06-03T05:34:46.687756+00:00"} {"global_step": 232375, "acc_step": 0, "speed/wps": 5538.365042267036, "speed/FLOPS": 244767386946115.3, "speed/curr_iter_time": 2.9575, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9575, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 190.9, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04338293895125389, "optim/lr": 2.3503913476085492e-05, "optim/total_tokens": 1949302784000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.27238929271698, "created_at": "2025-06-03T05:34:49.654059+00:00"} {"global_step": 232376, "acc_step": 0, "speed/wps": 5515.440653900995, "speed/FLOPS": 243754246317992.84, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04326394945383072, "optim/lr": 2.3500366250990946e-05, "optim/total_tokens": 1949311172608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.305982232093811, "created_at": "2025-06-03T05:34:52.629843+00:00"} {"global_step": 232377, "acc_step": 0, "speed/wps": 5535.513773378072, "speed/FLOPS": 244641375455340.25, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.01, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04343772679567337, "optim/lr": 2.349681902589662e-05, "optim/total_tokens": 1949319561216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2815766334533691, "created_at": "2025-06-03T05:34:55.593978+00:00"} {"global_step": 232378, "acc_step": 0, "speed/wps": 5535.327631812187, "speed/FLOPS": 244633148950887.03, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04296517372131348, "optim/lr": 2.3493271800802074e-05, "optim/total_tokens": 1949327949824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2959823608398438, "created_at": "2025-06-03T05:34:58.561950+00:00"} {"global_step": 232379, "acc_step": 0, "speed/wps": 5544.590544450765, "speed/FLOPS": 245042522277627.3, "speed/curr_iter_time": 2.9542, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9542, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.43 hours", "speed/est_time_elapsed_hrs": 190.69, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.43, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04254154488444328, "optim/lr": 2.3489724575707527e-05, "optim/total_tokens": 1949336338432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2902947664260864, "created_at": "2025-06-03T05:35:01.523816+00:00"} {"global_step": 232380, "acc_step": 0, "speed/wps": 5532.55852137209, "speed/FLOPS": 244510768443026.8, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.11, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04271481931209564, "optim/lr": 2.348617735061298e-05, "optim/total_tokens": 1949344727040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2944954633712769, "created_at": "2025-06-03T05:35:04.489277+00:00"} {"global_step": 232381, "acc_step": 0, "speed/wps": 5509.327472404556, "speed/FLOPS": 243484074985949.66, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04628651961684227, "optim/lr": 2.3482630125518655e-05, "optim/total_tokens": 1949353115648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2952156066894531, "created_at": "2025-06-03T05:35:07.471524+00:00"} {"global_step": 232382, "acc_step": 0, "speed/wps": 5519.962510969876, "speed/FLOPS": 243954089255474.78, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042404137551784515, "optim/lr": 2.3479082900424108e-05, "optim/total_tokens": 1949361504256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2923518419265747, "created_at": "2025-06-03T05:35:10.447120+00:00"} {"global_step": 232383, "acc_step": 0, "speed/wps": 5509.700355399992, "speed/FLOPS": 243500554505759.75, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05519122630357742, "optim/lr": 2.3475535675329562e-05, "optim/total_tokens": 1949369892864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2929002046585083, "created_at": "2025-06-03T05:35:13.427047+00:00"} {"global_step": 232384, "acc_step": 0, "speed/wps": 5534.246105159437, "speed/FLOPS": 244585351008590.72, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.0, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045264340937137604, "optim/lr": 2.3471988450235015e-05, "optim/total_tokens": 1949378281472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2901333570480347, "created_at": "2025-06-03T05:35:16.391843+00:00"} {"global_step": 232385, "acc_step": 0, "speed/wps": 5520.203718897817, "speed/FLOPS": 243964749411275.7, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05529021471738815, "optim/lr": 2.3468441225140693e-05, "optim/total_tokens": 1949386670080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2750810384750366, "created_at": "2025-06-03T05:35:19.364060+00:00"} {"global_step": 232386, "acc_step": 0, "speed/wps": 5521.92458537054, "speed/FLOPS": 244040802901176.9, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.05604095011949539, "optim/lr": 2.3464894000046143e-05, "optim/total_tokens": 1949395058688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2844256162643433, "created_at": "2025-06-03T05:35:22.335206+00:00"} {"global_step": 232387, "acc_step": 0, "speed/wps": 5527.701998615828, "speed/FLOPS": 244296134995136.97, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04550092667341232, "optim/lr": 2.3461346774951596e-05, "optim/total_tokens": 1949403447296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.302381992340088, "created_at": "2025-06-03T05:35:25.303667+00:00"} {"global_step": 232388, "acc_step": 0, "speed/wps": 5515.057798157232, "speed/FLOPS": 243737326053751.88, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.66, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04950779303908348, "optim/lr": 2.345779954985705e-05, "optim/total_tokens": 1949411835904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2948118448257446, "created_at": "2025-06-03T05:35:28.278515+00:00"} {"global_step": 232389, "acc_step": 0, "speed/wps": 5511.464614294223, "speed/FLOPS": 243578525718589.12, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04402197152376175, "optim/lr": 2.3454252324762727e-05, "optim/total_tokens": 1949420224512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2915269136428833, "created_at": "2025-06-03T05:35:31.256234+00:00"} {"global_step": 232390, "acc_step": 0, "speed/wps": 5519.50620779996, "speed/FLOPS": 243933922990935.84, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04454680159687996, "optim/lr": 2.345070509966818e-05, "optim/total_tokens": 1949428613120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.27594792842865, "created_at": "2025-06-03T05:35:34.228596+00:00"} {"global_step": 232391, "acc_step": 0, "speed/wps": 5528.636531206202, "speed/FLOPS": 244337436552260.06, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04318941384553909, "optim/lr": 2.344715787457363e-05, "optim/total_tokens": 1949437001728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3127269744873047, "created_at": "2025-06-03T05:35:37.198187+00:00"} {"global_step": 232392, "acc_step": 0, "speed/wps": 5517.532947012038, "speed/FLOPS": 243846714964173.97, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04458533972501755, "optim/lr": 2.3443610649479085e-05, "optim/total_tokens": 1949445390336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.285751461982727, "created_at": "2025-06-03T05:35:40.172270+00:00"} {"global_step": 232393, "acc_step": 0, "speed/wps": 5522.57381136843, "speed/FLOPS": 244069495367243.78, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04270222783088684, "optim/lr": 2.3440063424384762e-05, "optim/total_tokens": 1949453778944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2941426038742065, "created_at": "2025-06-03T05:35:43.142976+00:00"} {"global_step": 232394, "acc_step": 0, "speed/wps": 5538.848860305127, "speed/FLOPS": 244788769226993.72, "speed/curr_iter_time": 2.9564, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9564, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 190.85, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042108237743377686, "optim/lr": 2.3436516199290215e-05, "optim/total_tokens": 1949462167552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2996671199798584, "created_at": "2025-06-03T05:35:46.109211+00:00"} {"global_step": 232395, "acc_step": 0, "speed/wps": 5527.147443337878, "speed/FLOPS": 244271626490322.78, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044201042503118515, "optim/lr": 2.343296897419567e-05, "optim/total_tokens": 1949470556160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3040566444396973, "created_at": "2025-06-03T05:35:49.078039+00:00"} {"global_step": 232396, "acc_step": 0, "speed/wps": 5520.883318380506, "speed/FLOPS": 243994784229905.06, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04285164922475815, "optim/lr": 2.342942174910112e-05, "optim/total_tokens": 1949478944768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2913962602615356, "created_at": "2025-06-03T05:35:52.052430+00:00"} {"global_step": 232397, "acc_step": 0, "speed/wps": 5518.859396042022, "speed/FLOPS": 243905337221917.7, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044984348118305206, "optim/lr": 2.3425874524006797e-05, "optim/total_tokens": 1949487333376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2902511358261108, "created_at": "2025-06-03T05:35:55.026772+00:00"} {"global_step": 232398, "acc_step": 0, "speed/wps": 5428.446361318751, "speed/FLOPS": 239909543863012.44, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.46 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.46, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044059351086616516, "optim/lr": 2.342232729891225e-05, "optim/total_tokens": 1949495721984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2961881160736084, "created_at": "2025-06-03T05:35:58.054853+00:00"} {"global_step": 232399, "acc_step": 0, "speed/wps": 5514.47517094731, "speed/FLOPS": 243711576913229.72, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04562903195619583, "optim/lr": 2.3418780073817704e-05, "optim/total_tokens": 1949504110592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2976841926574707, "created_at": "2025-06-03T05:36:01.034442+00:00"} {"global_step": 232400, "acc_step": 0, "speed/wps": 5513.960172011952, "speed/FLOPS": 243688816596290.38, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04354624077677727, "optim/lr": 2.3415232848723157e-05, "optim/total_tokens": 1949512499200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2931432723999023, "created_at": "2025-06-03T05:36:04.013466+00:00"} {"global_step": 232401, "acc_step": 0, "speed/wps": 5534.573873108438, "speed/FLOPS": 244599836674268.12, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 190.99, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04426182806491852, "optim/lr": 2.341168562362883e-05, "optim/total_tokens": 1949520887808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2709332704544067, "created_at": "2025-06-03T05:36:06.979247+00:00"} {"global_step": 232402, "acc_step": 0, "speed/wps": 5521.719258380619, "speed/FLOPS": 244031728499181.25, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.048011671751737595, "optim/lr": 2.3408138398534285e-05, "optim/total_tokens": 1949529276416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.294931411743164, "created_at": "2025-06-03T05:36:09.950667+00:00"} {"global_step": 232403, "acc_step": 0, "speed/wps": 5539.494039358168, "speed/FLOPS": 244817282838812.38, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 190.89, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04289552941918373, "optim/lr": 2.340459117343974e-05, "optim/total_tokens": 1949537665024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2764042615890503, "created_at": "2025-06-03T05:36:12.916778+00:00"} {"global_step": 232404, "acc_step": 0, "speed/wps": 5518.768936607112, "speed/FLOPS": 243901339377908.0, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04815327376127243, "optim/lr": 2.3401043948345412e-05, "optim/total_tokens": 1949546053632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2889434099197388, "created_at": "2025-06-03T05:36:15.893742+00:00"} {"global_step": 232405, "acc_step": 0, "speed/wps": 5512.899222935521, "speed/FLOPS": 243641928077541.78, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.44 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.44, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042534489184617996, "optim/lr": 2.3397496723250866e-05, "optim/total_tokens": 1949554442240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2860110998153687, "created_at": "2025-06-03T05:36:18.870572+00:00"} {"global_step": 232406, "acc_step": 0, "speed/wps": 5507.514155261453, "speed/FLOPS": 243403935649623.03, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045335426926612854, "optim/lr": 2.339394949815632e-05, "optim/total_tokens": 1949562830848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2903984785079956, "created_at": "2025-06-03T05:36:21.849664+00:00"} {"global_step": 232407, "acc_step": 0, "speed/wps": 5509.020889052706, "speed/FLOPS": 243470525571033.72, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.45 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.45, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04213205724954605, "optim/lr": 2.3390402273061773e-05, "optim/total_tokens": 1949571219456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3096097707748413, "created_at": "2025-06-03T05:36:24.831715+00:00"} {"global_step": 232408, "acc_step": 0, "speed/wps": 5532.150536149986, "speed/FLOPS": 244492737584467.5, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.09, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.047255393117666245, "optim/lr": 2.3386855047967447e-05, "optim/total_tokens": 1949579608064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2888872623443604, "created_at": "2025-06-03T05:36:27.798403+00:00"} {"global_step": 232409, "acc_step": 0, "speed/wps": 5523.865725037157, "speed/FLOPS": 244126591338787.9, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.43 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.43, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042986590415239334, "optim/lr": 2.33833078228729e-05, "optim/total_tokens": 1949587996672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2968939542770386, "created_at": "2025-06-03T05:36:30.773901+00:00"} {"global_step": 232410, "acc_step": 0, "speed/wps": 5525.248736602693, "speed/FLOPS": 244187713371089.66, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.43 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.43, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045254647731781006, "optim/lr": 2.3379760597778354e-05, "optim/total_tokens": 1949596385280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2849924564361572, "created_at": "2025-06-03T05:36:33.743943+00:00"} {"global_step": 232411, "acc_step": 0, "speed/wps": 5532.64526746666, "speed/FLOPS": 244514602176400.06, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04196350276470184, "optim/lr": 2.3376213372683808e-05, "optim/total_tokens": 1949604773888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.298370361328125, "created_at": "2025-06-03T05:36:36.712770+00:00"} {"global_step": 232412, "acc_step": 0, "speed/wps": 5519.491378587089, "speed/FLOPS": 243933267615629.72, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.43 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.43, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046595167368650436, "optim/lr": 2.337266614758948e-05, "optim/total_tokens": 1949613162496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2904759645462036, "created_at": "2025-06-03T05:36:39.686280+00:00"} {"global_step": 232413, "acc_step": 0, "speed/wps": 5524.026325445613, "speed/FLOPS": 244133689054814.25, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.43 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.43, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042318619787693024, "optim/lr": 2.3369118922494935e-05, "optim/total_tokens": 1949621551104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2736320495605469, "created_at": "2025-06-03T05:36:42.658577+00:00"} {"global_step": 232414, "acc_step": 0, "speed/wps": 5515.141125325012, "speed/FLOPS": 243741008688060.62, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.43 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.43, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.045457709580659866, "optim/lr": 2.336557169740039e-05, "optim/total_tokens": 1949629939712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.307841420173645, "created_at": "2025-06-03T05:36:45.639870+00:00"} {"global_step": 232415, "acc_step": 0, "speed/wps": 5521.755055356271, "speed/FLOPS": 244033310542279.53, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.0422736294567585, "optim/lr": 2.3362024472305842e-05, "optim/total_tokens": 1949638328320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2816474437713623, "created_at": "2025-06-03T05:36:48.615593+00:00"} {"global_step": 232416, "acc_step": 0, "speed/wps": 5524.25577773963, "speed/FLOPS": 244143829671766.47, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042390406131744385, "optim/lr": 2.335847724721152e-05, "optim/total_tokens": 1949646716928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2917141914367676, "created_at": "2025-06-03T05:36:51.585507+00:00"} {"global_step": 232417, "acc_step": 0, "speed/wps": 5525.851704501745, "speed/FLOPS": 244214361465958.3, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04183555394411087, "optim/lr": 2.335493002211697e-05, "optim/total_tokens": 1949655105536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2910211086273193, "created_at": "2025-06-03T05:36:54.557518+00:00"} {"global_step": 232418, "acc_step": 0, "speed/wps": 5525.290400192124, "speed/FLOPS": 244189554688488.97, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04235611483454704, "optim/lr": 2.3351382797022423e-05, "optim/total_tokens": 1949663494144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2933074235916138, "created_at": "2025-06-03T05:36:57.528741+00:00"} {"global_step": 232419, "acc_step": 0, "speed/wps": 5534.666393733084, "speed/FLOPS": 244603925612313.97, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.07, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043122172355651855, "optim/lr": 2.3347835571927877e-05, "optim/total_tokens": 1949671882752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.275945782661438, "created_at": "2025-06-03T05:37:00.493167+00:00"} {"global_step": 232420, "acc_step": 0, "speed/wps": 5527.023160943785, "speed/FLOPS": 244266133844638.84, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04554352909326553, "optim/lr": 2.3344288346833554e-05, "optim/total_tokens": 1949680271360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2907755374908447, "created_at": "2025-06-03T05:37:03.461895+00:00"} {"global_step": 232421, "acc_step": 0, "speed/wps": 5522.57415419918, "speed/FLOPS": 244069510518608.16, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043111734092235565, "optim/lr": 2.3340741121739008e-05, "optim/total_tokens": 1949688659968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2884739637374878, "created_at": "2025-06-03T05:37:06.433543+00:00"} {"global_step": 232422, "acc_step": 0, "speed/wps": 5525.569379567665, "speed/FLOPS": 244201884148941.97, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04174107313156128, "optim/lr": 2.3337193896644458e-05, "optim/total_tokens": 1949697048576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2917265892028809, "created_at": "2025-06-03T05:37:09.402925+00:00"} {"global_step": 232423, "acc_step": 0, "speed/wps": 5513.041047777018, "speed/FLOPS": 243648196009610.66, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.43 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.43, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042986445128917694, "optim/lr": 2.333364667154991e-05, "optim/total_tokens": 1949705437184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2924141883850098, "created_at": "2025-06-03T05:37:12.382424+00:00"} {"global_step": 232424, "acc_step": 0, "speed/wps": 5518.036460675657, "speed/FLOPS": 243868967690889.38, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04249727353453636, "optim/lr": 2.333009944645559e-05, "optim/total_tokens": 1949713825792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.291872262954712, "created_at": "2025-06-03T05:37:15.359257+00:00"} {"global_step": 232425, "acc_step": 0, "speed/wps": 5531.845013870724, "speed/FLOPS": 244479235063528.94, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.1, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04202956706285477, "optim/lr": 2.3326552221361042e-05, "optim/total_tokens": 1949722214400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.300248146057129, "created_at": "2025-06-03T05:37:18.326501+00:00"} {"global_step": 232426, "acc_step": 0, "speed/wps": 5535.717956272402, "speed/FLOPS": 244650399294166.84, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.03, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04232130944728851, "optim/lr": 2.3323004996266496e-05, "optim/total_tokens": 1949730603008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3000214099884033, "created_at": "2025-06-03T05:37:21.290303+00:00"} {"global_step": 232427, "acc_step": 0, "speed/wps": 5524.004029814722, "speed/FLOPS": 244132703702048.28, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046016838401556015, "optim/lr": 2.3319457771171946e-05, "optim/total_tokens": 1949738991616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2903270721435547, "created_at": "2025-06-03T05:37:24.261791+00:00"} {"global_step": 232428, "acc_step": 0, "speed/wps": 5522.894374538536, "speed/FLOPS": 244083662618571.4, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.042429205030202866, "optim/lr": 2.3315910546077624e-05, "optim/total_tokens": 1949747380224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.289818286895752, "created_at": "2025-06-03T05:37:27.234875+00:00"} {"global_step": 232429, "acc_step": 0, "speed/wps": 5529.224742900783, "speed/FLOPS": 244363432498420.16, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.048967666923999786, "optim/lr": 2.3312363320983077e-05, "optim/total_tokens": 1949755768832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2904407978057861, "created_at": "2025-06-03T05:37:30.203261+00:00"} {"global_step": 232430, "acc_step": 0, "speed/wps": 5518.469993333446, "speed/FLOPS": 243888127615342.34, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04185991734266281, "optim/lr": 2.330881609588853e-05, "optim/total_tokens": 1949764157440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2986512184143066, "created_at": "2025-06-03T05:37:33.176338+00:00"} {"global_step": 232431, "acc_step": 0, "speed/wps": 5522.601343283621, "speed/FLOPS": 244070712136974.1, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04782060161232948, "optim/lr": 2.3305268870794205e-05, "optim/total_tokens": 1949772546048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.299793004989624, "created_at": "2025-06-03T05:37:36.148205+00:00"} {"global_step": 232432, "acc_step": 0, "speed/wps": 5517.811903312715, "speed/FLOPS": 243859043404836.12, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.42 hours", "speed/est_time_elapsed_hrs": 191.66, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.42, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04574989899992943, "optim/lr": 2.3301721645699658e-05, "optim/total_tokens": 1949780934656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.28449547290802, "created_at": "2025-06-03T05:37:39.122427+00:00"} {"global_step": 232433, "acc_step": 0, "speed/wps": 5530.850448899493, "speed/FLOPS": 244435280382445.53, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04492385312914848, "optim/lr": 2.3298174420605112e-05, "optim/total_tokens": 1949789323264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2771004438400269, "created_at": "2025-06-03T05:37:42.089201+00:00"} {"global_step": 232434, "acc_step": 0, "speed/wps": 5534.597587043202, "speed/FLOPS": 244600884708805.78, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04676651209592819, "optim/lr": 2.3294627195510565e-05, "optim/total_tokens": 1949797711872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.298356533050537, "created_at": "2025-06-03T05:37:45.055863+00:00"} {"global_step": 232435, "acc_step": 0, "speed/wps": 5526.932258313273, "speed/FLOPS": 244262116413652.06, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.043806374073028564, "optim/lr": 2.329107997041624e-05, "optim/total_tokens": 1949806100480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2904179096221924, "created_at": "2025-06-03T05:37:48.027746+00:00"} {"global_step": 232436, "acc_step": 0, "speed/wps": 5531.995811591714, "speed/FLOPS": 244485899550944.0, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04650290310382843, "optim/lr": 2.3287532745321693e-05, "optim/total_tokens": 1949814489088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2928578853607178, "created_at": "2025-06-03T05:37:50.993827+00:00"} {"global_step": 232437, "acc_step": 0, "speed/wps": 5524.6366716156845, "speed/FLOPS": 244160663231496.5, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04272143915295601, "optim/lr": 2.3283985520227146e-05, "optim/total_tokens": 1949822877696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3030894994735718, "created_at": "2025-06-03T05:37:53.965727+00:00"} {"global_step": 232438, "acc_step": 0, "speed/wps": 5519.06465929829, "speed/FLOPS": 243914408807212.12, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.047642335295677185, "optim/lr": 2.32804382951326e-05, "optim/total_tokens": 1949831266304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2968013286590576, "created_at": "2025-06-03T05:37:56.938850+00:00"} {"global_step": 232439, "acc_step": 0, "speed/wps": 5526.941228109216, "speed/FLOPS": 244262512832721.16, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04457506164908409, "optim/lr": 2.3276891070038274e-05, "optim/total_tokens": 1949839654912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2934644222259521, "created_at": "2025-06-03T05:37:59.911827+00:00"} {"global_step": 232440, "acc_step": 0, "speed/wps": 5518.076967545295, "speed/FLOPS": 243870757887194.4, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04455818235874176, "optim/lr": 2.3273343844943727e-05, "optim/total_tokens": 1949848043520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.287689447402954, "created_at": "2025-06-03T05:38:02.887180+00:00"} {"global_step": 232441, "acc_step": 0, "speed/wps": 5526.29218099164, "speed/FLOPS": 244233828272248.6, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04475551098585129, "optim/lr": 2.326979661984918e-05, "optim/total_tokens": 1949856432128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2983216047286987, "created_at": "2025-06-03T05:38:05.861453+00:00"} {"global_step": 232442, "acc_step": 0, "speed/wps": 5514.8308562463835, "speed/FLOPS": 243727296382886.38, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.046919144690036774, "optim/lr": 2.3266249394754635e-05, "optim/total_tokens": 1949864820736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3021926879882812, "created_at": "2025-06-03T05:38:08.836410+00:00"} {"global_step": 232443, "acc_step": 0, "speed/wps": 5530.585880893254, "speed/FLOPS": 244423587830751.6, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.047895397990942, "optim/lr": 2.3262702169660312e-05, "optim/total_tokens": 1949873209344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2824554443359375, "created_at": "2025-06-03T05:38:11.806567+00:00"} {"global_step": 232444, "acc_step": 0, "speed/wps": 5520.73755892049, "speed/FLOPS": 243988342407836.88, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.044276319444179535, "optim/lr": 2.3259154944565762e-05, "optim/total_tokens": 1949881597952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2964510917663574, "created_at": "2025-06-03T05:38:14.779156+00:00"} {"global_step": 232445, "acc_step": 0, "speed/wps": 5529.74152052075, "speed/FLOPS": 244386271424115.06, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.2, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042871151119470596, "optim/lr": 2.3255607719471216e-05, "optim/total_tokens": 1949889986560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3045927286148071, "created_at": "2025-06-03T05:38:17.746443+00:00"} {"global_step": 232446, "acc_step": 0, "speed/wps": 5509.6674215285075, "speed/FLOPS": 243499098997210.97, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04518526792526245, "optim/lr": 2.325206049437667e-05, "optim/total_tokens": 1949898375168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2903026342391968, "created_at": "2025-06-03T05:38:20.724675+00:00"} {"global_step": 232447, "acc_step": 0, "speed/wps": 5527.9211436166315, "speed/FLOPS": 244305820082486.7, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043744295835494995, "optim/lr": 2.3248513269282347e-05, "optim/total_tokens": 1949906763776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2869141101837158, "created_at": "2025-06-03T05:38:23.693203+00:00"} {"global_step": 232448, "acc_step": 0, "speed/wps": 5524.142688012927, "speed/FLOPS": 244138831684691.9, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043409254401922226, "optim/lr": 2.32449660441878e-05, "optim/total_tokens": 1949915152384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2862902879714966, "created_at": "2025-06-03T05:38:26.664363+00:00"} {"global_step": 232449, "acc_step": 0, "speed/wps": 5511.779742777301, "speed/FLOPS": 243592452784567.38, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.41 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.41, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04366130754351616, "optim/lr": 2.324141881909325e-05, "optim/total_tokens": 1949923540992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2899587154388428, "created_at": "2025-06-03T05:38:29.645426+00:00"} {"global_step": 232450, "acc_step": 0, "speed/wps": 5525.951591984232, "speed/FLOPS": 244218775981413.75, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042146652936935425, "optim/lr": 2.3237871593998704e-05, "optim/total_tokens": 1949931929600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.289592981338501, "created_at": "2025-06-03T05:38:32.615028+00:00"} {"global_step": 232451, "acc_step": 0, "speed/wps": 5543.802156532855, "speed/FLOPS": 245007679566990.88, "speed/curr_iter_time": 2.9546, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9546, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 190.78, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043519582599401474, "optim/lr": 2.323432436890438e-05, "optim/total_tokens": 1949940318208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.285969614982605, "created_at": "2025-06-03T05:38:35.574890+00:00"} {"global_step": 232452, "acc_step": 0, "speed/wps": 5526.5507084274195, "speed/FLOPS": 244245253861646.7, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042478445917367935, "optim/lr": 2.3230777143809835e-05, "optim/total_tokens": 1949948706816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2945300340652466, "created_at": "2025-06-03T05:38:38.545292+00:00"} {"global_step": 232453, "acc_step": 0, "speed/wps": 5538.693303970801, "speed/FLOPS": 244781894433226.0, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 190.95, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04490720480680466, "optim/lr": 2.322722991871529e-05, "optim/total_tokens": 1949957095424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2879054546356201, "created_at": "2025-06-03T05:38:41.512001+00:00"} {"global_step": 232454, "acc_step": 0, "speed/wps": 5511.281192882495, "speed/FLOPS": 243570419431026.62, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.23, "optim/grad_norm": 0.04220264405012131, "optim/lr": 2.322368269362074e-05, "optim/total_tokens": 1949965484032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.282129168510437, "created_at": "2025-06-03T05:38:44.489768+00:00"} {"global_step": 232455, "acc_step": 0, "speed/wps": 5517.553051530261, "speed/FLOPS": 243847603480975.2, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04476919770240784, "optim/lr": 2.3220135468526416e-05, "optim/total_tokens": 1949973872640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2920323610305786, "created_at": "2025-06-03T05:38:47.465216+00:00"} {"global_step": 232456, "acc_step": 0, "speed/wps": 5515.396808254591, "speed/FLOPS": 243752308564844.16, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04441510885953903, "optim/lr": 2.321658824343187e-05, "optim/total_tokens": 1949982261248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2921596765518188, "created_at": "2025-06-03T05:38:50.444119+00:00"} {"global_step": 232457, "acc_step": 0, "speed/wps": 5517.892201025357, "speed/FLOPS": 243862592152733.97, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04218258708715439, "optim/lr": 2.3213041018337323e-05, "optim/total_tokens": 1949990649856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2696441411972046, "created_at": "2025-06-03T05:38:53.419585+00:00"} {"global_step": 232458, "acc_step": 0, "speed/wps": 5522.493803377009, "speed/FLOPS": 244065959423540.97, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04674730822443962, "optim/lr": 2.3209493793242997e-05, "optim/total_tokens": 1949999038464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2952569723129272, "created_at": "2025-06-03T05:38:56.395723+00:00"} {"global_step": 232459, "acc_step": 0, "speed/wps": 5528.890199388507, "speed/FLOPS": 244348647387526.5, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044948760420084, "optim/lr": 2.320594656814845e-05, "optim/total_tokens": 1950007427072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2823857069015503, "created_at": "2025-06-03T05:38:59.362932+00:00"} {"global_step": 232460, "acc_step": 0, "speed/wps": 5529.045494885342, "speed/FLOPS": 244355510653612.2, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04737759009003639, "optim/lr": 2.3202399343053904e-05, "optim/total_tokens": 1950015815680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.288857102394104, "created_at": "2025-06-03T05:39:02.335774+00:00"} {"global_step": 232461, "acc_step": 0, "speed/wps": 5515.866311847602, "speed/FLOPS": 243773058220518.03, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.048422034829854965, "optim/lr": 2.3198852117959358e-05, "optim/total_tokens": 1950024204288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.283647894859314, "created_at": "2025-06-03T05:39:05.310359+00:00"} {"global_step": 232462, "acc_step": 0, "speed/wps": 5533.99231913126, "speed/FLOPS": 244574134965139.94, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04485419765114784, "optim/lr": 2.319530489286503e-05, "optim/total_tokens": 1950032592896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2940232753753662, "created_at": "2025-06-03T05:39:08.278708+00:00"} {"global_step": 232463, "acc_step": 0, "speed/wps": 5517.117348304897, "speed/FLOPS": 243828347628545.38, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046222150325775146, "optim/lr": 2.3191757667770485e-05, "optim/total_tokens": 1950040981504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2872314453125, "created_at": "2025-06-03T05:39:11.253967+00:00"} {"global_step": 232464, "acc_step": 0, "speed/wps": 5507.913522772673, "speed/FLOPS": 243421585649470.72, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04321412369608879, "optim/lr": 2.318821044267594e-05, "optim/total_tokens": 1950049370112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2920866012573242, "created_at": "2025-06-03T05:39:14.232822+00:00"} {"global_step": 232465, "acc_step": 0, "speed/wps": 5515.247142782634, "speed/FLOPS": 243745694117041.0, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04476415738463402, "optim/lr": 2.3184663217581392e-05, "optim/total_tokens": 1950057758720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3019273281097412, "created_at": "2025-06-03T05:39:17.211222+00:00"} {"global_step": 232466, "acc_step": 0, "speed/wps": 5507.029742579057, "speed/FLOPS": 243382527088510.0, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.4 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.4, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04459301009774208, "optim/lr": 2.3181115992487066e-05, "optim/total_tokens": 1950066147328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2995109558105469, "created_at": "2025-06-03T05:39:20.191775+00:00"} {"global_step": 232467, "acc_step": 0, "speed/wps": 5522.028222648094, "speed/FLOPS": 244045383138381.16, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045051757246255875, "optim/lr": 2.317756876739252e-05, "optim/total_tokens": 1950074535936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2910135984420776, "created_at": "2025-06-03T05:39:23.164083+00:00"} {"global_step": 232468, "acc_step": 0, "speed/wps": 5522.649478744221, "speed/FLOPS": 244072839477952.97, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.047991350293159485, "optim/lr": 2.3174021542297973e-05, "optim/total_tokens": 1950082924544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.316798448562622, "created_at": "2025-06-03T05:39:26.134915+00:00"} {"global_step": 232469, "acc_step": 0, "speed/wps": 5526.412620708941, "speed/FLOPS": 244239151091286.97, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045788709074258804, "optim/lr": 2.3170474317203427e-05, "optim/total_tokens": 1950091313152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2952101230621338, "created_at": "2025-06-03T05:39:29.104107+00:00"} {"global_step": 232470, "acc_step": 0, "speed/wps": 5527.890256167131, "speed/FLOPS": 244304455015315.06, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046398501843214035, "optim/lr": 2.31669270921091e-05, "optim/total_tokens": 1950099701760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.286755084991455, "created_at": "2025-06-03T05:39:32.075406+00:00"} {"global_step": 232471, "acc_step": 0, "speed/wps": 5515.148001974411, "speed/FLOPS": 243741312600766.2, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.047066766768693924, "optim/lr": 2.3163379867014554e-05, "optim/total_tokens": 1950108090368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2772382497787476, "created_at": "2025-06-03T05:39:35.054041+00:00"} {"global_step": 232472, "acc_step": 0, "speed/wps": 5526.290654186546, "speed/FLOPS": 244233760795278.34, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.34, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04471684992313385, "optim/lr": 2.3159832641920008e-05, "optim/total_tokens": 1950116478976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.282097339630127, "created_at": "2025-06-03T05:39:38.023135+00:00"} {"global_step": 232473, "acc_step": 0, "speed/wps": 5524.521711705823, "speed/FLOPS": 244155582591898.78, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04350222274661064, "optim/lr": 2.3156285416825462e-05, "optim/total_tokens": 1950124867584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3134299516677856, "created_at": "2025-06-03T05:39:40.997081+00:00"} {"global_step": 232474, "acc_step": 0, "speed/wps": 5509.810427005906, "speed/FLOPS": 243505419107343.56, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.39 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.39, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04624786600470543, "optim/lr": 2.315273819173114e-05, "optim/total_tokens": 1950133256192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2987110614776611, "created_at": "2025-06-03T05:39:43.975005+00:00"} {"global_step": 232475, "acc_step": 0, "speed/wps": 5539.662371733027, "speed/FLOPS": 244824722268177.9, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 190.88, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04554292932152748, "optim/lr": 2.314919096663659e-05, "optim/total_tokens": 1950141644800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2826347351074219, "created_at": "2025-06-03T05:39:46.942020+00:00"} {"global_step": 232476, "acc_step": 0, "speed/wps": 5527.625478888276, "speed/FLOPS": 244292753214842.62, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04287964850664139, "optim/lr": 2.3145643741542043e-05, "optim/total_tokens": 1950150033408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3069586753845215, "created_at": "2025-06-03T05:39:49.910755+00:00"} {"global_step": 232477, "acc_step": 0, "speed/wps": 5531.167918184074, "speed/FLOPS": 244449310899868.88, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.23, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045041363686323166, "optim/lr": 2.3142096516447496e-05, "optim/total_tokens": 1950158422016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.3025068044662476, "created_at": "2025-06-03T05:39:52.878256+00:00"} {"global_step": 232478, "acc_step": 0, "speed/wps": 5523.91925949263, "speed/FLOPS": 244128957287705.62, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04243478178977966, "optim/lr": 2.3138549291353174e-05, "optim/total_tokens": 1950166810624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2819633483886719, "created_at": "2025-06-03T05:39:55.851143+00:00"} {"global_step": 232479, "acc_step": 0, "speed/wps": 5520.0046049617995, "speed/FLOPS": 243955949594461.22, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04494152590632439, "optim/lr": 2.3135002066258627e-05, "optim/total_tokens": 1950175199232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2804151773452759, "created_at": "2025-06-03T05:39:58.824147+00:00"} {"global_step": 232480, "acc_step": 0, "speed/wps": 5518.26283953525, "speed/FLOPS": 243878972477771.38, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04264291748404503, "optim/lr": 2.3131454841164077e-05, "optim/total_tokens": 1950183587840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2903037071228027, "created_at": "2025-06-03T05:40:01.801286+00:00"} {"global_step": 232481, "acc_step": 0, "speed/wps": 5524.945148244949, "speed/FLOPS": 244174296319583.5, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043116211891174316, "optim/lr": 2.312790761606953e-05, "optim/total_tokens": 1950191976448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2961175441741943, "created_at": "2025-06-03T05:40:04.772494+00:00"} {"global_step": 232482, "acc_step": 0, "speed/wps": 5513.675982719855, "speed/FLOPS": 243676256884192.38, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04213894531130791, "optim/lr": 2.3124360390975208e-05, "optim/total_tokens": 1950200365056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.293820858001709, "created_at": "2025-06-03T05:40:07.752007+00:00"} {"global_step": 232483, "acc_step": 0, "speed/wps": 5508.81015389533, "speed/FLOPS": 243461212155718.03, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.38 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.38, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.048585642129182816, "optim/lr": 2.3120813165880662e-05, "optim/total_tokens": 1950208753664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2885812520980835, "created_at": "2025-06-03T05:40:10.734871+00:00"} {"global_step": 232484, "acc_step": 0, "speed/wps": 5516.420239374935, "speed/FLOPS": 243797538981968.0, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044271182268857956, "optim/lr": 2.3117265940786115e-05, "optim/total_tokens": 1950217142272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.295566201210022, "created_at": "2025-06-03T05:40:13.713652+00:00"} {"global_step": 232485, "acc_step": 0, "speed/wps": 5532.130601283847, "speed/FLOPS": 244491856565420.06, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04459613561630249, "optim/lr": 2.311371871569179e-05, "optim/total_tokens": 1950225530880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3013781309127808, "created_at": "2025-06-03T05:40:16.680431+00:00"} {"global_step": 232486, "acc_step": 0, "speed/wps": 5532.532635222988, "speed/FLOPS": 244509624407733.84, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.19, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044280048459768295, "optim/lr": 2.3110171490597243e-05, "optim/total_tokens": 1950233919488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2842156887054443, "created_at": "2025-06-03T05:40:19.646583+00:00"} {"global_step": 232487, "acc_step": 0, "speed/wps": 5518.507389711743, "speed/FLOPS": 243889780343851.06, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042100295424461365, "optim/lr": 2.3106624265502696e-05, "optim/total_tokens": 1950242308096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2900313138961792, "created_at": "2025-06-03T05:40:22.622765+00:00"} {"global_step": 232488, "acc_step": 0, "speed/wps": 5527.922016901664, "speed/FLOPS": 244305858677215.25, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04555002972483635, "optim/lr": 2.310307704040815e-05, "optim/total_tokens": 1950250696704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2896345853805542, "created_at": "2025-06-03T05:40:25.591903+00:00"} {"global_step": 232489, "acc_step": 0, "speed/wps": 5514.230048112729, "speed/FLOPS": 243700743738593.62, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04318630322813988, "optim/lr": 2.3099529815313824e-05, "optim/total_tokens": 1950259085312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.280158519744873, "created_at": "2025-06-03T05:40:28.572026+00:00"} {"global_step": 232490, "acc_step": 0, "speed/wps": 5518.356425460083, "speed/FLOPS": 243883108496632.78, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042018018662929535, "optim/lr": 2.3095982590219278e-05, "optim/total_tokens": 1950267473920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.286267876625061, "created_at": "2025-06-03T05:40:31.545666+00:00"} {"global_step": 232491, "acc_step": 0, "speed/wps": 5516.810272800217, "speed/FLOPS": 243814776462993.44, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04255491867661476, "optim/lr": 2.309243536512473e-05, "optim/total_tokens": 1950275862528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.299900770187378, "created_at": "2025-06-03T05:40:34.520033+00:00"} {"global_step": 232492, "acc_step": 0, "speed/wps": 5520.898176731345, "speed/FLOPS": 243995440892960.2, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042294424027204514, "optim/lr": 2.3088888140030185e-05, "optim/total_tokens": 1950284251136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2951098680496216, "created_at": "2025-06-03T05:40:37.496154+00:00"} {"global_step": 232493, "acc_step": 0, "speed/wps": 5524.233544006715, "speed/FLOPS": 244142847054574.22, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04291073977947235, "optim/lr": 2.308534091493586e-05, "optim/total_tokens": 1950292639744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3027198314666748, "created_at": "2025-06-03T05:40:40.469511+00:00"} {"global_step": 232494, "acc_step": 0, "speed/wps": 5527.7374298612995, "speed/FLOPS": 244297700874833.25, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042706139385700226, "optim/lr": 2.3081793689841312e-05, "optim/total_tokens": 1950301028352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.3002841472625732, "created_at": "2025-06-03T05:40:43.438192+00:00"} {"global_step": 232495, "acc_step": 0, "speed/wps": 5522.2151908080605, "speed/FLOPS": 244053646174061.88, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04264795407652855, "optim/lr": 2.3078246464746766e-05, "optim/total_tokens": 1950309416960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2960286140441895, "created_at": "2025-06-03T05:40:46.412596+00:00"} {"global_step": 232496, "acc_step": 0, "speed/wps": 5526.568613886554, "speed/FLOPS": 244246045191291.97, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.35 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.35, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042740240693092346, "optim/lr": 2.307469923965222e-05, "optim/total_tokens": 1950317805568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2845534086227417, "created_at": "2025-06-03T05:40:49.382453+00:00"} {"global_step": 232497, "acc_step": 0, "speed/wps": 5523.903110457855, "speed/FLOPS": 244128243583026.84, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04272855445742607, "optim/lr": 2.3071152014557893e-05, "optim/total_tokens": 1950326194176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2781611680984497, "created_at": "2025-06-03T05:40:52.356850+00:00"} {"global_step": 232498, "acc_step": 0, "speed/wps": 5513.141717055974, "speed/FLOPS": 243652645076468.4, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.37 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.37, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043661318719387054, "optim/lr": 2.3067604789463347e-05, "optim/total_tokens": 1950334582784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2816393375396729, "created_at": "2025-06-03T05:40:55.336607+00:00"} {"global_step": 232499, "acc_step": 0, "speed/wps": 5513.71541249681, "speed/FLOPS": 243677999478513.9, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043657224625349045, "optim/lr": 2.30640575643688e-05, "optim/total_tokens": 1950342971392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2927969694137573, "created_at": "2025-06-03T05:40:58.314856+00:00"} {"global_step": 232500, "acc_step": 0, "speed/wps": 5515.050482150501, "speed/FLOPS": 243737002723701.06, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04295876994729042, "optim/lr": 2.3060510339274254e-05, "optim/total_tokens": 1950351360000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2835420370101929, "created_at": "2025-06-03T05:41:01.290963+00:00"} {"global_step": 232501, "acc_step": 0, "speed/wps": 5521.661342856996, "speed/FLOPS": 244029168929475.62, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04267958179116249, "optim/lr": 2.305696311417993e-05, "optim/total_tokens": 1950359748608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2895344495773315, "created_at": "2025-06-03T05:41:04.267182+00:00"} {"global_step": 232502, "acc_step": 0, "speed/wps": 5529.663598149529, "speed/FLOPS": 244382827654149.94, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04296193644404411, "optim/lr": 2.305341588908538e-05, "optim/total_tokens": 1950368137216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2922531366348267, "created_at": "2025-06-03T05:41:07.236620+00:00"} {"global_step": 232503, "acc_step": 0, "speed/wps": 5519.288303926314, "speed/FLOPS": 243924292755053.8, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04320618882775307, "optim/lr": 2.3049868663990835e-05, "optim/total_tokens": 1950376525824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3094699382781982, "created_at": "2025-06-03T05:41:10.213638+00:00"} {"global_step": 232504, "acc_step": 0, "speed/wps": 5526.87436274237, "speed/FLOPS": 244259557725754.53, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.35 hours", "speed/est_time_elapsed_hrs": 191.4, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.35, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04293819144368172, "optim/lr": 2.304632143889629e-05, "optim/total_tokens": 1950384914432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.279991865158081, "created_at": "2025-06-03T05:41:13.182879+00:00"} {"global_step": 232505, "acc_step": 0, "speed/wps": 5512.968357574252, "speed/FLOPS": 243644983474710.56, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04219783842563629, "optim/lr": 2.3042774213801966e-05, "optim/total_tokens": 1950393303040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3001267910003662, "created_at": "2025-06-03T05:41:16.158709+00:00"} {"global_step": 232506, "acc_step": 0, "speed/wps": 5516.316042326818, "speed/FLOPS": 243792934005770.1, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.35 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.35, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043554164469242096, "optim/lr": 2.303922698870742e-05, "optim/total_tokens": 1950401691648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.293567419052124, "created_at": "2025-06-03T05:41:19.133106+00:00"} {"global_step": 232507, "acc_step": 0, "speed/wps": 5511.764592408295, "speed/FLOPS": 243591783215803.94, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042437683790922165, "optim/lr": 2.303567976361287e-05, "optim/total_tokens": 1950410080256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.283861756324768, "created_at": "2025-06-03T05:41:22.113222+00:00"} {"global_step": 232508, "acc_step": 0, "speed/wps": 5511.538514572216, "speed/FLOPS": 243581791732620.47, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04455672577023506, "optim/lr": 2.3032132538518323e-05, "optim/total_tokens": 1950418468864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2984987497329712, "created_at": "2025-06-03T05:41:25.092895+00:00"} {"global_step": 232509, "acc_step": 0, "speed/wps": 5506.14241019348, "speed/FLOPS": 243343311538846.38, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.36 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.36, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04519197717308998, "optim/lr": 2.3028585313424e-05, "optim/total_tokens": 1950426857472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2951956987380981, "created_at": "2025-06-03T05:41:28.076941+00:00"} {"global_step": 232510, "acc_step": 0, "speed/wps": 5524.9367067704425, "speed/FLOPS": 244173923249617.7, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04440992698073387, "optim/lr": 2.3025038088329454e-05, "optim/total_tokens": 1950435246080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2885595560073853, "created_at": "2025-06-03T05:41:31.052502+00:00"} {"global_step": 232511, "acc_step": 0, "speed/wps": 5525.887120709916, "speed/FLOPS": 244215926681082.88, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04549112543463707, "optim/lr": 2.3021490863234908e-05, "optim/total_tokens": 1950443634688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.282767653465271, "created_at": "2025-06-03T05:41:34.021802+00:00"} {"global_step": 232512, "acc_step": 0, "speed/wps": 5528.218202377073, "speed/FLOPS": 244318948559213.62, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04302283376455307, "optim/lr": 2.301794363814058e-05, "optim/total_tokens": 1950452023296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2827037572860718, "created_at": "2025-06-03T05:41:36.992572+00:00"} {"global_step": 232513, "acc_step": 0, "speed/wps": 5515.386243575104, "speed/FLOPS": 243751841660085.78, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.35 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.35, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044664040207862854, "optim/lr": 2.3014396413046035e-05, "optim/total_tokens": 1950460411904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2943224906921387, "created_at": "2025-06-03T05:41:39.967534+00:00"} {"global_step": 232514, "acc_step": 0, "speed/wps": 5531.137348770064, "speed/FLOPS": 244447959888238.1, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04995900020003319, "optim/lr": 2.301084918795149e-05, "optim/total_tokens": 1950468800512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2937545776367188, "created_at": "2025-06-03T05:41:42.937004+00:00"} {"global_step": 232515, "acc_step": 0, "speed/wps": 5527.537564537191, "speed/FLOPS": 244288867850511.12, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04645644128322601, "optim/lr": 2.3007301962856942e-05, "optim/total_tokens": 1950477189120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.2823888063430786, "created_at": "2025-06-03T05:41:45.908682+00:00"} {"global_step": 232516, "acc_step": 0, "speed/wps": 5513.357169527509, "speed/FLOPS": 243662166972924.5, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.35 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.35, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043185800313949585, "optim/lr": 2.3003754737762616e-05, "optim/total_tokens": 1950485577728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2911332845687866, "created_at": "2025-06-03T05:41:48.889096+00:00"} {"global_step": 232517, "acc_step": 0, "speed/wps": 5521.591341430831, "speed/FLOPS": 244026075224738.88, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0461822971701622, "optim/lr": 2.300020751266807e-05, "optim/total_tokens": 1950493966336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2844429016113281, "created_at": "2025-06-03T05:41:51.861910+00:00"} {"global_step": 232518, "acc_step": 0, "speed/wps": 5516.096100282018, "speed/FLOPS": 243783213693155.34, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.35 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.35, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04659130424261093, "optim/lr": 2.2996660287573523e-05, "optim/total_tokens": 1950502354944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2869822978973389, "created_at": "2025-06-03T05:41:54.838840+00:00"} {"global_step": 232519, "acc_step": 0, "speed/wps": 5527.996689220635, "speed/FLOPS": 244309158811506.16, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05018777772784233, "optim/lr": 2.2993113062478977e-05, "optim/total_tokens": 1950510743552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2996054887771606, "created_at": "2025-06-03T05:41:57.811070+00:00"} {"global_step": 232520, "acc_step": 0, "speed/wps": 5518.003681930728, "speed/FLOPS": 243867519038140.34, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04695477336645126, "optim/lr": 2.298956583738465e-05, "optim/total_tokens": 1950519132160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2839744091033936, "created_at": "2025-06-03T05:42:00.785321+00:00"} {"global_step": 232521, "acc_step": 0, "speed/wps": 5521.448017502511, "speed/FLOPS": 244019741040705.53, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04441789910197258, "optim/lr": 2.2986018612290105e-05, "optim/total_tokens": 1950527520768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2872811555862427, "created_at": "2025-06-03T05:42:03.757511+00:00"} {"global_step": 232522, "acc_step": 0, "speed/wps": 5531.528966990157, "speed/FLOPS": 244465267409082.44, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.21, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04950268566608429, "optim/lr": 2.2982471387195558e-05, "optim/total_tokens": 1950535909376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2965117692947388, "created_at": "2025-06-03T05:42:06.728127+00:00"} {"global_step": 232523, "acc_step": 0, "speed/wps": 5522.161717544648, "speed/FLOPS": 244051282929520.03, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04295666888356209, "optim/lr": 2.2978924162101012e-05, "optim/total_tokens": 1950544297984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2771263122558594, "created_at": "2025-06-03T05:42:09.700846+00:00"} {"global_step": 232524, "acc_step": 0, "speed/wps": 5517.181978894181, "speed/FLOPS": 243831203969782.38, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04639632999897003, "optim/lr": 2.2975376937006686e-05, "optim/total_tokens": 1950552686592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2793842554092407, "created_at": "2025-06-03T05:42:12.676038+00:00"} {"global_step": 232525, "acc_step": 0, "speed/wps": 5523.583169422604, "speed/FLOPS": 244114103826875.4, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045537497848272324, "optim/lr": 2.297182971191214e-05, "optim/total_tokens": 1950561075200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3092652559280396, "created_at": "2025-06-03T05:42:15.647195+00:00"} {"global_step": 232526, "acc_step": 0, "speed/wps": 5528.285417745747, "speed/FLOPS": 244321919134469.53, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04606584832072258, "optim/lr": 2.2968282486817593e-05, "optim/total_tokens": 1950569463808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2761623859405518, "created_at": "2025-06-03T05:42:18.616334+00:00"} {"global_step": 232527, "acc_step": 0, "speed/wps": 5531.087684898728, "speed/FLOPS": 244445764999327.78, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045520808547735214, "optim/lr": 2.2964735261723046e-05, "optim/total_tokens": 1950577852416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2930395603179932, "created_at": "2025-06-03T05:42:21.584515+00:00"} {"global_step": 232528, "acc_step": 0, "speed/wps": 5514.103078947115, "speed/FLOPS": 243695132351360.6, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04388311505317688, "optim/lr": 2.296118803662872e-05, "optim/total_tokens": 1950586241024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2876557111740112, "created_at": "2025-06-03T05:42:24.561779+00:00"} {"global_step": 232529, "acc_step": 0, "speed/wps": 5519.710968875082, "speed/FLOPS": 243942972382394.0, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04329824075102806, "optim/lr": 2.2957640811534174e-05, "optim/total_tokens": 1950594629632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2953898906707764, "created_at": "2025-06-03T05:42:27.536741+00:00"} {"global_step": 232530, "acc_step": 0, "speed/wps": 5529.591885471331, "speed/FLOPS": 244379658320832.34, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04504714906215668, "optim/lr": 2.2954093586439627e-05, "optim/total_tokens": 1950603018240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3111469745635986, "created_at": "2025-06-03T05:42:30.504958+00:00"} {"global_step": 232531, "acc_step": 0, "speed/wps": 5512.292296367595, "speed/FLOPS": 243615105029771.25, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.34 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.34, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04216090217232704, "optim/lr": 2.295054636134508e-05, "optim/total_tokens": 1950611406848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.300012230873108, "created_at": "2025-06-03T05:42:33.484672+00:00"} {"global_step": 232532, "acc_step": 0, "speed/wps": 5521.092828817055, "speed/FLOPS": 244004043518828.88, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04869436100125313, "optim/lr": 2.2946999136250758e-05, "optim/total_tokens": 1950619795456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2992539405822754, "created_at": "2025-06-03T05:42:36.457315+00:00"} {"global_step": 232533, "acc_step": 0, "speed/wps": 5515.37675230053, "speed/FLOPS": 243751422194330.34, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0451672337949276, "optim/lr": 2.294345191115621e-05, "optim/total_tokens": 1950628184064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2864553928375244, "created_at": "2025-06-03T05:42:39.439482+00:00"} {"global_step": 232534, "acc_step": 0, "speed/wps": 5523.723924169787, "speed/FLOPS": 244120324466252.78, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04571127891540527, "optim/lr": 2.2939904686061662e-05, "optim/total_tokens": 1950636572672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2864969968795776, "created_at": "2025-06-03T05:42:42.410883+00:00"} {"global_step": 232535, "acc_step": 0, "speed/wps": 5531.663132981256, "speed/FLOPS": 244471196859165.22, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.27, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04833387956023216, "optim/lr": 2.2936357460967116e-05, "optim/total_tokens": 1950644961280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2872389554977417, "created_at": "2025-06-03T05:42:45.377787+00:00"} {"global_step": 232536, "acc_step": 0, "speed/wps": 5528.040951694622, "speed/FLOPS": 244311114986300.53, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04322744160890579, "optim/lr": 2.2932810235872793e-05, "optim/total_tokens": 1950653349888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2826546430587769, "created_at": "2025-06-03T05:42:48.350934+00:00"} {"global_step": 232537, "acc_step": 0, "speed/wps": 5524.421501622499, "speed/FLOPS": 244151153819137.56, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0442204549908638, "optim/lr": 2.2929263010778247e-05, "optim/total_tokens": 1950661738496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.29725182056427, "created_at": "2025-06-03T05:42:51.326863+00:00"} {"global_step": 232538, "acc_step": 0, "speed/wps": 5517.128703416007, "speed/FLOPS": 243828849466335.7, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04477942734956741, "optim/lr": 2.2925715785683697e-05, "optim/total_tokens": 1950670127104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2789602279663086, "created_at": "2025-06-03T05:42:54.302290+00:00"} {"global_step": 232539, "acc_step": 0, "speed/wps": 5535.507053991689, "speed/FLOPS": 244641078492855.03, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.08, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04185080528259277, "optim/lr": 2.2922168560589374e-05, "optim/total_tokens": 1950678515712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2902238368988037, "created_at": "2025-06-03T05:42:57.270050+00:00"} {"global_step": 232540, "acc_step": 0, "speed/wps": 5519.169406942122, "speed/FLOPS": 243919038116922.47, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043272532522678375, "optim/lr": 2.2918621335494828e-05, "optim/total_tokens": 1950686904320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2861076593399048, "created_at": "2025-06-03T05:43:00.244187+00:00"} {"global_step": 232541, "acc_step": 0, "speed/wps": 5514.496932944912, "speed/FLOPS": 243712538682135.72, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04368634521961212, "optim/lr": 2.291507411040028e-05, "optim/total_tokens": 1950695292928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2937275171279907, "created_at": "2025-06-03T05:43:03.220356+00:00"} {"global_step": 232542, "acc_step": 0, "speed/wps": 5518.4634559112055, "speed/FLOPS": 243887838694740.88, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04276638850569725, "optim/lr": 2.2911526885305735e-05, "optim/total_tokens": 1950703681536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2887542247772217, "created_at": "2025-06-03T05:43:06.194109+00:00"} {"global_step": 232543, "acc_step": 0, "speed/wps": 5525.075333710224, "speed/FLOPS": 244180049850799.03, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045220937579870224, "optim/lr": 2.290797966021141e-05, "optim/total_tokens": 1950712070144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2820264101028442, "created_at": "2025-06-03T05:43:09.164658+00:00"} {"global_step": 232544, "acc_step": 0, "speed/wps": 5526.155145999773, "speed/FLOPS": 244227772027016.75, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04351446405053139, "optim/lr": 2.2904432435116862e-05, "optim/total_tokens": 1950720458752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3061144351959229, "created_at": "2025-06-03T05:43:12.134785+00:00"} {"global_step": 232545, "acc_step": 0, "speed/wps": 5527.4838053562935, "speed/FLOPS": 244286491969879.88, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.048228245228528976, "optim/lr": 2.2900885210022316e-05, "optim/total_tokens": 1950728847360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2990115880966187, "created_at": "2025-06-03T05:43:15.107049+00:00"} {"global_step": 232546, "acc_step": 0, "speed/wps": 5522.686269071866, "speed/FLOPS": 244074465422124.94, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044354479759931564, "optim/lr": 2.289733798492777e-05, "optim/total_tokens": 1950737235968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2724840641021729, "created_at": "2025-06-03T05:43:18.079087+00:00"} {"global_step": 232547, "acc_step": 0, "speed/wps": 5517.315421695192, "speed/FLOPS": 243837101458564.88, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04292970523238182, "optim/lr": 2.2893790759833443e-05, "optim/total_tokens": 1950745624576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.276555061340332, "created_at": "2025-06-03T05:43:21.053983+00:00"} {"global_step": 232548, "acc_step": 0, "speed/wps": 5521.420555138744, "speed/FLOPS": 244018527344792.16, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04289446398615837, "optim/lr": 2.2890243534738897e-05, "optim/total_tokens": 1950754013184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3037750720977783, "created_at": "2025-06-03T05:43:24.026709+00:00"} {"global_step": 232549, "acc_step": 0, "speed/wps": 5528.16542622272, "speed/FLOPS": 244316616123324.06, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045408155769109726, "optim/lr": 2.288669630964435e-05, "optim/total_tokens": 1950762401792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.3014490604400635, "created_at": "2025-06-03T05:43:26.998732+00:00"} {"global_step": 232550, "acc_step": 0, "speed/wps": 5511.746647188249, "speed/FLOPS": 243590990128929.84, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046569351106882095, "optim/lr": 2.2883149084549804e-05, "optim/total_tokens": 1950770790400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2996760606765747, "created_at": "2025-06-03T05:43:29.976701+00:00"} {"global_step": 232551, "acc_step": 0, "speed/wps": 5506.164821240559, "speed/FLOPS": 243344301992417.12, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.33 hours", "speed/est_time_elapsed_hrs": 192.16, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.33, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042137812823057175, "optim/lr": 2.2879601859455478e-05, "optim/total_tokens": 1950779179008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2868070602416992, "created_at": "2025-06-03T05:43:32.957313+00:00"} {"global_step": 232552, "acc_step": 0, "speed/wps": 5530.916945787782, "speed/FLOPS": 244438219204545.97, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0460866317152977, "optim/lr": 2.287605463436093e-05, "optim/total_tokens": 1950787567616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2870023250579834, "created_at": "2025-06-03T05:43:35.924645+00:00"} {"global_step": 232553, "acc_step": 0, "speed/wps": 5527.035495857442, "speed/FLOPS": 244266678984686.66, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04199566692113876, "optim/lr": 2.2872507409266385e-05, "optim/total_tokens": 1950795956224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.290325403213501, "created_at": "2025-06-03T05:43:38.894892+00:00"} {"global_step": 232554, "acc_step": 0, "speed/wps": 5527.4469571603795, "speed/FLOPS": 244284863468226.62, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04655646160244942, "optim/lr": 2.286896018417184e-05, "optim/total_tokens": 1950804344832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2818927764892578, "created_at": "2025-06-03T05:43:41.864052+00:00"} {"global_step": 232555, "acc_step": 0, "speed/wps": 5527.414752513881, "speed/FLOPS": 244283440187689.72, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044140443205833435, "optim/lr": 2.2865412959077513e-05, "optim/total_tokens": 1950812733440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2913638353347778, "created_at": "2025-06-03T05:43:44.836415+00:00"} {"global_step": 232556, "acc_step": 0, "speed/wps": 5513.275684123215, "speed/FLOPS": 243658565735134.84, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046601369976997375, "optim/lr": 2.2861865733982966e-05, "optim/total_tokens": 1950821122048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.282736897468567, "created_at": "2025-06-03T05:43:47.815242+00:00"} {"global_step": 232557, "acc_step": 0, "speed/wps": 5512.53827948233, "speed/FLOPS": 243625976224386.84, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.32 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.32, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04748016223311424, "optim/lr": 2.285831850888842e-05, "optim/total_tokens": 1950829510656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.302366852760315, "created_at": "2025-06-03T05:43:50.792587+00:00"} {"global_step": 232558, "acc_step": 0, "speed/wps": 5519.371736903256, "speed/FLOPS": 243927980065585.94, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.71, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04560623690485954, "optim/lr": 2.2854771283793873e-05, "optim/total_tokens": 1950837899264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2816038131713867, "created_at": "2025-06-03T05:43:53.771296+00:00"} {"global_step": 232559, "acc_step": 0, "speed/wps": 5519.376717991684, "speed/FLOPS": 243928200204198.97, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.049956366419792175, "optim/lr": 2.285122405869955e-05, "optim/total_tokens": 1950846287872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.30446457862854, "created_at": "2025-06-03T05:43:56.744835+00:00"} {"global_step": 232560, "acc_step": 0, "speed/wps": 5525.749394188295, "speed/FLOPS": 244209839873775.47, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04368039593100548, "optim/lr": 2.2847676833605e-05, "optim/total_tokens": 1950854676480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2964627742767334, "created_at": "2025-06-03T05:43:59.715881+00:00"} {"global_step": 232561, "acc_step": 0, "speed/wps": 5524.25528031059, "speed/FLOPS": 244143807687949.0, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04801448807120323, "optim/lr": 2.2844129608510454e-05, "optim/total_tokens": 1950863065088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3074935674667358, "created_at": "2025-06-03T05:44:02.686739+00:00"} {"global_step": 232562, "acc_step": 0, "speed/wps": 5526.629374298659, "speed/FLOPS": 244248730490507.03, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044371381402015686, "optim/lr": 2.2840582383415908e-05, "optim/total_tokens": 1950871453696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2758338451385498, "created_at": "2025-06-03T05:44:05.656065+00:00"} {"global_step": 232563, "acc_step": 0, "speed/wps": 5527.548630856398, "speed/FLOPS": 244289356925177.5, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04449578747153282, "optim/lr": 2.2837035158321585e-05, "optim/total_tokens": 1950879842304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.274958610534668, "created_at": "2025-06-03T05:44:08.627232+00:00"} {"global_step": 232564, "acc_step": 0, "speed/wps": 5517.760520233374, "speed/FLOPS": 243856772535731.72, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0500456728041172, "optim/lr": 2.283348793322704e-05, "optim/total_tokens": 1950888230912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.302716612815857, "created_at": "2025-06-03T05:44:11.601578+00:00"} {"global_step": 232565, "acc_step": 0, "speed/wps": 5525.912982027588, "speed/FLOPS": 244217069618953.78, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04954409599304199, "optim/lr": 2.282994070813249e-05, "optim/total_tokens": 1950896619520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2949565649032593, "created_at": "2025-06-03T05:44:14.570935+00:00"} {"global_step": 232566, "acc_step": 0, "speed/wps": 5513.604025305838, "speed/FLOPS": 243673076734804.25, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04547816142439842, "optim/lr": 2.2826393483038166e-05, "optim/total_tokens": 1950905008128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2934269905090332, "created_at": "2025-06-03T05:44:17.547374+00:00"} {"global_step": 232567, "acc_step": 0, "speed/wps": 5510.1731646226335, "speed/FLOPS": 243521450253343.5, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04602961987257004, "optim/lr": 2.282284625794362e-05, "optim/total_tokens": 1950913396736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2908647060394287, "created_at": "2025-06-03T05:44:20.525094+00:00"} {"global_step": 232568, "acc_step": 0, "speed/wps": 5527.689693727617, "speed/FLOPS": 244295591182060.16, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044550444930791855, "optim/lr": 2.2819299032849074e-05, "optim/total_tokens": 1950921785344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2837777137756348, "created_at": "2025-06-03T05:44:23.498411+00:00"} {"global_step": 232569, "acc_step": 0, "speed/wps": 5511.428444272493, "speed/FLOPS": 243576927188763.6, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.047554709017276764, "optim/lr": 2.2815751807754527e-05, "optim/total_tokens": 1950930173952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.303436517715454, "created_at": "2025-06-03T05:44:26.477539+00:00"} {"global_step": 232570, "acc_step": 0, "speed/wps": 5514.341193547447, "speed/FLOPS": 243705655797914.25, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04450219124555588, "optim/lr": 2.28122045826602e-05, "optim/total_tokens": 1950938562560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2897628545761108, "created_at": "2025-06-03T05:44:29.453412+00:00"} {"global_step": 232571, "acc_step": 0, "speed/wps": 5521.720309518585, "speed/FLOPS": 244031774954099.12, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04342523217201233, "optim/lr": 2.2808657357565655e-05, "optim/total_tokens": 1950946951168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.300876259803772, "created_at": "2025-06-03T05:44:32.425586+00:00"} {"global_step": 232572, "acc_step": 0, "speed/wps": 5516.123604401936, "speed/FLOPS": 243784429234476.9, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044756531715393066, "optim/lr": 2.2805110132471108e-05, "optim/total_tokens": 1950955339776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2902580499649048, "created_at": "2025-06-03T05:44:35.400735+00:00"} {"global_step": 232573, "acc_step": 0, "speed/wps": 5511.288934853572, "speed/FLOPS": 243570761586521.22, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042588528245687485, "optim/lr": 2.2801562907376562e-05, "optim/total_tokens": 1950963728384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2891426086425781, "created_at": "2025-06-03T05:44:38.378195+00:00"} {"global_step": 232574, "acc_step": 0, "speed/wps": 5513.178549273148, "speed/FLOPS": 243654272871943.1, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043494813144207, "optim/lr": 2.2798015682282236e-05, "optim/total_tokens": 1950972116992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2711281776428223, "created_at": "2025-06-03T05:44:41.359099+00:00"} {"global_step": 232575, "acc_step": 0, "speed/wps": 5505.585741403028, "speed/FLOPS": 243318709627597.56, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.31 hours", "speed/est_time_elapsed_hrs": 192.2, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.31, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04311584308743477, "optim/lr": 2.279446845718769e-05, "optim/total_tokens": 1950980505600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.28266179561615, "created_at": "2025-06-03T05:44:44.342417+00:00"} {"global_step": 232576, "acc_step": 0, "speed/wps": 5517.792472729414, "speed/FLOPS": 243858184672508.97, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 191.71, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042152199894189835, "optim/lr": 2.2790921232093143e-05, "optim/total_tokens": 1950988894208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2729636430740356, "created_at": "2025-06-03T05:44:47.320080+00:00"} {"global_step": 232577, "acc_step": 0, "speed/wps": 5531.738867868843, "speed/FLOPS": 244474543953550.28, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04358449950814247, "optim/lr": 2.2787374006998596e-05, "optim/total_tokens": 1950997282816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2989780902862549, "created_at": "2025-06-03T05:44:50.292212+00:00"} {"global_step": 232578, "acc_step": 0, "speed/wps": 5530.169911605918, "speed/FLOPS": 244405204117375.12, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.35, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043395016342401505, "optim/lr": 2.278382678190427e-05, "optim/total_tokens": 1951005671424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2935107946395874, "created_at": "2025-06-03T05:44:53.263702+00:00"} {"global_step": 232579, "acc_step": 0, "speed/wps": 5511.279776660099, "speed/FLOPS": 243570356841245.6, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04300948977470398, "optim/lr": 2.2780279556809724e-05, "optim/total_tokens": 1951014060032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2825275659561157, "created_at": "2025-06-03T05:44:56.244342+00:00"} {"global_step": 232580, "acc_step": 0, "speed/wps": 5515.406676122836, "speed/FLOPS": 243752744674112.25, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04305016249418259, "optim/lr": 2.2776732331715177e-05, "optim/total_tokens": 1951022448640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3084771633148193, "created_at": "2025-06-03T05:44:59.220499+00:00"} {"global_step": 232581, "acc_step": 0, "speed/wps": 5523.530227660342, "speed/FLOPS": 244111764071963.9, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042084019631147385, "optim/lr": 2.277318510662063e-05, "optim/total_tokens": 1951030837248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2911897897720337, "created_at": "2025-06-03T05:45:02.196457+00:00"} {"global_step": 232582, "acc_step": 0, "speed/wps": 5516.226004399335, "speed/FLOPS": 243788954790231.22, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04224706068634987, "optim/lr": 2.2769637881526305e-05, "optim/total_tokens": 1951039225856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2949113845825195, "created_at": "2025-06-03T05:45:05.174186+00:00"} {"global_step": 232583, "acc_step": 0, "speed/wps": 5513.081859705726, "speed/FLOPS": 243649999687965.12, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04295605793595314, "optim/lr": 2.276609065643176e-05, "optim/total_tokens": 1951047614464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2880020141601562, "created_at": "2025-06-03T05:45:08.150502+00:00"} {"global_step": 232584, "acc_step": 0, "speed/wps": 5513.596355022312, "speed/FLOPS": 243672737747532.5, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04446214437484741, "optim/lr": 2.2762543431337212e-05, "optim/total_tokens": 1951056003072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2836761474609375, "created_at": "2025-06-03T05:45:11.126781+00:00"} {"global_step": 232585, "acc_step": 0, "speed/wps": 5521.488870380679, "speed/FLOPS": 244021546528816.56, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.66, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04627932980656624, "optim/lr": 2.2758996206242666e-05, "optim/total_tokens": 1951064391680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2767436504364014, "created_at": "2025-06-03T05:45:14.098191+00:00"} {"global_step": 232586, "acc_step": 0, "speed/wps": 5517.752906740789, "speed/FLOPS": 243856436058328.8, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04492481052875519, "optim/lr": 2.275544898114834e-05, "optim/total_tokens": 1951072780288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2984665632247925, "created_at": "2025-06-03T05:45:17.071994+00:00"} {"global_step": 232587, "acc_step": 0, "speed/wps": 5520.56733346516, "speed/FLOPS": 243980819314004.16, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.048447877168655396, "optim/lr": 2.2751901756053793e-05, "optim/total_tokens": 1951081168896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.293014645576477, "created_at": "2025-06-03T05:45:20.045774+00:00"} {"global_step": 232588, "acc_step": 0, "speed/wps": 5522.166526863153, "speed/FLOPS": 244051495476781.62, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04263515770435333, "optim/lr": 2.2748354530959247e-05, "optim/total_tokens": 1951089557504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.295074224472046, "created_at": "2025-06-03T05:45:23.020933+00:00"} {"global_step": 232589, "acc_step": 0, "speed/wps": 5522.403586639579, "speed/FLOPS": 244061972305517.7, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043117839843034744, "optim/lr": 2.27448073058647e-05, "optim/total_tokens": 1951097946112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2962533235549927, "created_at": "2025-06-03T05:45:25.992451+00:00"} {"global_step": 232590, "acc_step": 0, "speed/wps": 5506.252063936151, "speed/FLOPS": 243348157673013.7, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.3 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.3, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04482610151171684, "optim/lr": 2.2741260080770378e-05, "optim/total_tokens": 1951106334720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2902343273162842, "created_at": "2025-06-03T05:45:28.973681+00:00"} {"global_step": 232591, "acc_step": 0, "speed/wps": 5516.15292749971, "speed/FLOPS": 243785725165309.28, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046105507761240005, "optim/lr": 2.2737712855675828e-05, "optim/total_tokens": 1951114723328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2996342182159424, "created_at": "2025-06-03T05:45:31.954456+00:00"} {"global_step": 232592, "acc_step": 0, "speed/wps": 5510.898874223817, "speed/FLOPS": 243553522903197.38, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044460564851760864, "optim/lr": 2.273416563058128e-05, "optim/total_tokens": 1951123111936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.292784571647644, "created_at": "2025-06-03T05:45:34.936007+00:00"} {"global_step": 232593, "acc_step": 0, "speed/wps": 5519.685192852186, "speed/FLOPS": 243941833214115.7, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04573037847876549, "optim/lr": 2.273061840548696e-05, "optim/total_tokens": 1951131500544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2803359031677246, "created_at": "2025-06-03T05:45:37.914391+00:00"} {"global_step": 232594, "acc_step": 0, "speed/wps": 5515.850480520741, "speed/FLOPS": 243772358556902.84, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04641246423125267, "optim/lr": 2.2727071180392412e-05, "optim/total_tokens": 1951139889152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3029968738555908, "created_at": "2025-06-03T05:45:40.889861+00:00"} {"global_step": 232595, "acc_step": 0, "speed/wps": 5512.333650357944, "speed/FLOPS": 243616932664475.78, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.049875304102897644, "optim/lr": 2.2723523955297866e-05, "optim/total_tokens": 1951148277760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2898104190826416, "created_at": "2025-06-03T05:45:43.867507+00:00"} {"global_step": 232596, "acc_step": 0, "speed/wps": 5516.248016320324, "speed/FLOPS": 243789927604471.7, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044804271310567856, "optim/lr": 2.2719976730203316e-05, "optim/total_tokens": 1951156666368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2928024530410767, "created_at": "2025-06-03T05:45:46.842857+00:00"} {"global_step": 232597, "acc_step": 0, "speed/wps": 5518.965050502267, "speed/FLOPS": 243910006608271.97, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.050702355802059174, "optim/lr": 2.2716429505108993e-05, "optim/total_tokens": 1951165054976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2873746156692505, "created_at": "2025-06-03T05:45:49.816494+00:00"} {"global_step": 232598, "acc_step": 0, "speed/wps": 5522.349770391635, "speed/FLOPS": 244059593902815.1, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044488005340099335, "optim/lr": 2.2712882280014447e-05, "optim/total_tokens": 1951173443584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2902448177337646, "created_at": "2025-06-03T05:45:52.787916+00:00"} {"global_step": 232599, "acc_step": 0, "speed/wps": 5514.297387849855, "speed/FLOPS": 243703719810298.6, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.050998758524656296, "optim/lr": 2.27093350549199e-05, "optim/total_tokens": 1951181832192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2895928621292114, "created_at": "2025-06-03T05:45:55.764104+00:00"} {"global_step": 232600, "acc_step": 0, "speed/wps": 5507.901735647626, "speed/FLOPS": 243421064718875.62, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04474534094333649, "optim/lr": 2.2705787829825354e-05, "optim/total_tokens": 1951190220800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.283874273300171, "created_at": "2025-06-03T05:45:58.746383+00:00"} {"global_step": 232601, "acc_step": 0, "speed/wps": 5515.120626450014, "speed/FLOPS": 243740102742708.5, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.049823928624391556, "optim/lr": 2.2702240604731028e-05, "optim/total_tokens": 1951198609408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.29472815990448, "created_at": "2025-06-03T05:46:01.723009+00:00"} {"global_step": 232602, "acc_step": 0, "speed/wps": 5532.306246680868, "speed/FLOPS": 244499619192933.75, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.29, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04255853220820427, "optim/lr": 2.269869337963648e-05, "optim/total_tokens": 1951206998016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2951620817184448, "created_at": "2025-06-03T05:46:04.689612+00:00"} {"global_step": 232603, "acc_step": 0, "speed/wps": 5524.4081361867975, "speed/FLOPS": 244150563135290.06, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04619544371962547, "optim/lr": 2.2695146154541935e-05, "optim/total_tokens": 1951215386624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3065803050994873, "created_at": "2025-06-03T05:46:07.660477+00:00"} {"global_step": 232604, "acc_step": 0, "speed/wps": 5523.936294957736, "speed/FLOPS": 244129710168067.9, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04450279474258423, "optim/lr": 2.269159892944739e-05, "optim/total_tokens": 1951223775232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.289304256439209, "created_at": "2025-06-03T05:46:10.634859+00:00"} {"global_step": 232605, "acc_step": 0, "speed/wps": 5527.865687325236, "speed/FLOPS": 244303369198258.0, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04646177962422371, "optim/lr": 2.2688051704353063e-05, "optim/total_tokens": 1951232163840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2907330989837646, "created_at": "2025-06-03T05:46:13.603222+00:00"} {"global_step": 232606, "acc_step": 0, "speed/wps": 5522.153610018116, "speed/FLOPS": 244050924618345.38, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04979430139064789, "optim/lr": 2.2684504479258516e-05, "optim/total_tokens": 1951240552448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.302418828010559, "created_at": "2025-06-03T05:46:16.574430+00:00"} {"global_step": 232607, "acc_step": 0, "speed/wps": 5522.2802334147145, "speed/FLOPS": 244056520724357.75, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.050527870655059814, "optim/lr": 2.268095725416397e-05, "optim/total_tokens": 1951248941056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2667559385299683, "created_at": "2025-06-03T05:46:19.549452+00:00"} {"global_step": 232608, "acc_step": 0, "speed/wps": 5516.971704149418, "speed/FLOPS": 243821910902347.56, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05221297964453697, "optim/lr": 2.2677410029069423e-05, "optim/total_tokens": 1951257329664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.295387625694275, "created_at": "2025-06-03T05:46:22.527288+00:00"} {"global_step": 232609, "acc_step": 0, "speed/wps": 5520.477493212526, "speed/FLOPS": 243976848834681.8, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.049532223492860794, "optim/lr": 2.2673862803975097e-05, "optim/total_tokens": 1951265718272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.290639877319336, "created_at": "2025-06-03T05:46:25.502898+00:00"} {"global_step": 232610, "acc_step": 0, "speed/wps": 5507.4343627617545, "speed/FLOPS": 243400409229551.4, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.28 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.28, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05010635405778885, "optim/lr": 2.267031557888055e-05, "optim/total_tokens": 1951274106880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2854154109954834, "created_at": "2025-06-03T05:46:28.482006+00:00"} {"global_step": 232611, "acc_step": 0, "speed/wps": 5525.013204562927, "speed/FLOPS": 244177304060494.28, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046196017414331436, "optim/lr": 2.2666768353786004e-05, "optim/total_tokens": 1951282495488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2957590818405151, "created_at": "2025-06-03T05:46:31.452086+00:00"} {"global_step": 232612, "acc_step": 0, "speed/wps": 5515.435195312167, "speed/FLOPS": 243754005076306.22, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.052313633263111115, "optim/lr": 2.2663221128691458e-05, "optim/total_tokens": 1951290884096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.278656244277954, "created_at": "2025-06-03T05:46:34.432545+00:00"} {"global_step": 232613, "acc_step": 0, "speed/wps": 5524.876486317342, "speed/FLOPS": 244171261813826.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04970560222864151, "optim/lr": 2.2659673903597132e-05, "optim/total_tokens": 1951299272704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2863166332244873, "created_at": "2025-06-03T05:46:37.405744+00:00"} {"global_step": 232614, "acc_step": 0, "speed/wps": 5525.116499269489, "speed/FLOPS": 244181869157814.12, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04860924929380417, "optim/lr": 2.2656126678502586e-05, "optim/total_tokens": 1951307661312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2956300973892212, "created_at": "2025-06-03T05:46:40.379809+00:00"} {"global_step": 232615, "acc_step": 0, "speed/wps": 5519.34357526422, "speed/FLOPS": 243926735465284.9, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04432705417275429, "optim/lr": 2.265257945340804e-05, "optim/total_tokens": 1951316049920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2736610174179077, "created_at": "2025-06-03T05:46:43.354354+00:00"} {"global_step": 232616, "acc_step": 0, "speed/wps": 5513.29693428579, "speed/FLOPS": 243659504883552.44, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0540936253964901, "optim/lr": 2.2649032228313493e-05, "optim/total_tokens": 1951324438528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2771004438400269, "created_at": "2025-06-03T05:46:46.331800+00:00"} {"global_step": 232617, "acc_step": 0, "speed/wps": 5511.950923600648, "speed/FLOPS": 243600018100776.4, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.26373183727264404, "optim/lr": 2.264548500321917e-05, "optim/total_tokens": 1951332827136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.3056983947753906, "created_at": "2025-06-03T05:46:49.310398+00:00"} {"global_step": 232618, "acc_step": 0, "speed/wps": 5487.728123690743, "speed/FLOPS": 242529494328287.94, "speed/curr_iter_time": 2.9848, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9848, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "5.29 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 5.29, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.048421479761600494, "optim/lr": 2.264193777812462e-05, "optim/total_tokens": 1951341215744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2857277393341064, "created_at": "2025-06-03T05:46:52.300942+00:00"} {"global_step": 232619, "acc_step": 0, "speed/wps": 5518.468625346483, "speed/FLOPS": 243888067157320.6, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0458090677857399, "optim/lr": 2.2638390553030074e-05, "optim/total_tokens": 1951349604352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2708343267440796, "created_at": "2025-06-03T05:46:55.275098+00:00"} {"global_step": 232620, "acc_step": 0, "speed/wps": 5521.150620218724, "speed/FLOPS": 244006597602979.44, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.053724516183137894, "optim/lr": 2.263484332793575e-05, "optim/total_tokens": 1951357992960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2918798923492432, "created_at": "2025-06-03T05:46:58.247592+00:00"} {"global_step": 232621, "acc_step": 0, "speed/wps": 5514.277345508223, "speed/FLOPS": 243702834041384.47, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05341332405805588, "optim/lr": 2.2631296102841205e-05, "optim/total_tokens": 1951366381568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.287738561630249, "created_at": "2025-06-03T05:47:01.223363+00:00"} {"global_step": 232622, "acc_step": 0, "speed/wps": 5524.511160616623, "speed/FLOPS": 244155116287761.53, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05726117640733719, "optim/lr": 2.2627748877746658e-05, "optim/total_tokens": 1951374770176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2927578687667847, "created_at": "2025-06-03T05:47:04.195146+00:00"} {"global_step": 232623, "acc_step": 0, "speed/wps": 5517.118148970412, "speed/FLOPS": 243828383013862.97, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05506715551018715, "optim/lr": 2.262420165265211e-05, "optim/total_tokens": 1951383158784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2762848138809204, "created_at": "2025-06-03T05:47:07.171907+00:00"} {"global_step": 232624, "acc_step": 0, "speed/wps": 5511.414059448968, "speed/FLOPS": 243576291453192.0, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05301721394062042, "optim/lr": 2.2620654427557786e-05, "optim/total_tokens": 1951391547392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2919796705245972, "created_at": "2025-06-03T05:47:10.151976+00:00"} {"global_step": 232625, "acc_step": 0, "speed/wps": 5516.558861354468, "speed/FLOPS": 243803665363931.75, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05498047545552254, "optim/lr": 2.261710720246324e-05, "optim/total_tokens": 1951399936000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2884633541107178, "created_at": "2025-06-03T05:47:13.127054+00:00"} {"global_step": 232626, "acc_step": 0, "speed/wps": 5506.424183454255, "speed/FLOPS": 243355764474726.34, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.27 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.27, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044396333396434784, "optim/lr": 2.2613559977368693e-05, "optim/total_tokens": 1951408324608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.277150273323059, "created_at": "2025-06-03T05:47:16.112096+00:00"} {"global_step": 232627, "acc_step": 0, "speed/wps": 5519.957095820337, "speed/FLOPS": 243953849933582.38, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05339767038822174, "optim/lr": 2.2610012752274146e-05, "optim/total_tokens": 1951416713216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2926644086837769, "created_at": "2025-06-03T05:47:19.085799+00:00"} {"global_step": 232628, "acc_step": 0, "speed/wps": 5523.891067906305, "speed/FLOPS": 244127711363887.66, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.61, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04496503248810768, "optim/lr": 2.260646552717982e-05, "optim/total_tokens": 1951425101824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2840900421142578, "created_at": "2025-06-03T05:47:22.061803+00:00"} {"global_step": 232629, "acc_step": 0, "speed/wps": 5520.820012644473, "speed/FLOPS": 243991986440400.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04620538279414177, "optim/lr": 2.2602918302085274e-05, "optim/total_tokens": 1951433490432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3027230501174927, "created_at": "2025-06-03T05:47:25.034009+00:00"} {"global_step": 232630, "acc_step": 0, "speed/wps": 5516.0287944365755, "speed/FLOPS": 243780239119289.34, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.047298043966293335, "optim/lr": 2.2599371076990728e-05, "optim/total_tokens": 1951441879040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2975547313690186, "created_at": "2025-06-03T05:47:28.012050+00:00"} {"global_step": 232631, "acc_step": 0, "speed/wps": 5517.943289300698, "speed/FLOPS": 243864849993010.53, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0452517531812191, "optim/lr": 2.259582385189618e-05, "optim/total_tokens": 1951450267648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2860788106918335, "created_at": "2025-06-03T05:47:30.985892+00:00"} {"global_step": 232632, "acc_step": 0, "speed/wps": 5516.05178025812, "speed/FLOPS": 243781254974949.5, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04723657667636871, "optim/lr": 2.2592276626801855e-05, "optim/total_tokens": 1951458656256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.3008480072021484, "created_at": "2025-06-03T05:47:33.961646+00:00"} {"global_step": 232633, "acc_step": 0, "speed/wps": 5513.495638900217, "speed/FLOPS": 243668286610447.75, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043636348098516464, "optim/lr": 2.258872940170731e-05, "optim/total_tokens": 1951467044864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3014060258865356, "created_at": "2025-06-03T05:47:36.937569+00:00"} {"global_step": 232634, "acc_step": 0, "speed/wps": 5503.018008498156, "speed/FLOPS": 243205228976050.62, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.26 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.26, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05614173039793968, "optim/lr": 2.2585182176612762e-05, "optim/total_tokens": 1951475433472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2948909997940063, "created_at": "2025-06-03T05:47:39.919772+00:00"} {"global_step": 232635, "acc_step": 0, "speed/wps": 5514.804203908185, "speed/FLOPS": 243726118485957.0, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043591588735580444, "optim/lr": 2.2581634951518216e-05, "optim/total_tokens": 1951483822080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2862725257873535, "created_at": "2025-06-03T05:47:42.895500+00:00"} {"global_step": 232636, "acc_step": 0, "speed/wps": 5532.132867195376, "speed/FLOPS": 244491956707111.66, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05099029466509819, "optim/lr": 2.257808772642389e-05, "optim/total_tokens": 1951492210688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2843101024627686, "created_at": "2025-06-03T05:47:45.862062+00:00"} {"global_step": 232637, "acc_step": 0, "speed/wps": 5528.660438839224, "speed/FLOPS": 244338493147269.28, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04318736866116524, "optim/lr": 2.2574540501329343e-05, "optim/total_tokens": 1951500599296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2898145914077759, "created_at": "2025-06-03T05:47:48.830232+00:00"} {"global_step": 232638, "acc_step": 0, "speed/wps": 5528.937200379291, "speed/FLOPS": 244350724590746.28, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04703139513731003, "optim/lr": 2.2570993276234797e-05, "optim/total_tokens": 1951508987904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2972028255462646, "created_at": "2025-06-03T05:47:51.798753+00:00"} {"global_step": 232639, "acc_step": 0, "speed/wps": 5527.299232384116, "speed/FLOPS": 244278334789239.75, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04553007334470749, "optim/lr": 2.256744605114025e-05, "optim/total_tokens": 1951517376512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2902319431304932, "created_at": "2025-06-03T05:47:54.771238+00:00"} {"global_step": 232640, "acc_step": 0, "speed/wps": 5514.851912238165, "speed/FLOPS": 243728226949948.78, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0464087650179863, "optim/lr": 2.2563898826045924e-05, "optim/total_tokens": 1951525765120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2908815145492554, "created_at": "2025-06-03T05:47:57.747001+00:00"} {"global_step": 232641, "acc_step": 0, "speed/wps": 5515.920006560351, "speed/FLOPS": 243775431251987.06, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.25 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.25, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04687012732028961, "optim/lr": 2.2560351600951378e-05, "optim/total_tokens": 1951534153728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.285129189491272, "created_at": "2025-06-03T05:48:00.726612+00:00"} {"global_step": 232642, "acc_step": 0, "speed/wps": 5525.0101415219215, "speed/FLOPS": 244177168689759.9, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04634883254766464, "optim/lr": 2.255680437585683e-05, "optim/total_tokens": 1951542542336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.266931414604187, "created_at": "2025-06-03T05:48:03.696898+00:00"} {"global_step": 232643, "acc_step": 0, "speed/wps": 5523.946309185645, "speed/FLOPS": 244130152745684.0, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04456116631627083, "optim/lr": 2.2553257150762285e-05, "optim/total_tokens": 1951550930944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2813078165054321, "created_at": "2025-06-03T05:48:06.669706+00:00"} {"global_step": 232644, "acc_step": 0, "speed/wps": 5523.296871885461, "speed/FLOPS": 244101450941137.3, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04310370609164238, "optim/lr": 2.254970992566796e-05, "optim/total_tokens": 1951559319552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2956304550170898, "created_at": "2025-06-03T05:48:09.644652+00:00"} {"global_step": 232645, "acc_step": 0, "speed/wps": 5524.127046786377, "speed/FLOPS": 244138140422537.47, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045115113258361816, "optim/lr": 2.2546162700573413e-05, "optim/total_tokens": 1951567708160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2906651496887207, "created_at": "2025-06-03T05:48:12.615427+00:00"} {"global_step": 232646, "acc_step": 0, "speed/wps": 5522.052357861598, "speed/FLOPS": 244046449791282.78, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04313857853412628, "optim/lr": 2.2542615475478866e-05, "optim/total_tokens": 1951576096768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.287190556526184, "created_at": "2025-06-03T05:48:15.587936+00:00"} {"global_step": 232647, "acc_step": 0, "speed/wps": 5525.503020312814, "speed/FLOPS": 244198951409535.03, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0437619686126709, "optim/lr": 2.253906825038432e-05, "optim/total_tokens": 1951584485376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2871019840240479, "created_at": "2025-06-03T05:48:18.561660+00:00"} {"global_step": 232648, "acc_step": 0, "speed/wps": 5526.607571996898, "speed/FLOPS": 244247766940363.47, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04340002313256264, "optim/lr": 2.2535521025289997e-05, "optim/total_tokens": 1951592873984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2874594926834106, "created_at": "2025-06-03T05:48:21.530994+00:00"} {"global_step": 232649, "acc_step": 0, "speed/wps": 5524.300032369192, "speed/FLOPS": 244145785499877.4, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.61, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04387470707297325, "optim/lr": 2.2531973800195447e-05, "optim/total_tokens": 1951601262592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.29727303981781, "created_at": "2025-06-03T05:48:24.503524+00:00"} {"global_step": 232650, "acc_step": 0, "speed/wps": 5510.855156000065, "speed/FLOPS": 243551590781477.7, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04297778755426407, "optim/lr": 2.25284265751009e-05, "optim/total_tokens": 1951609651200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2948788404464722, "created_at": "2025-06-03T05:48:27.481337+00:00"} {"global_step": 232651, "acc_step": 0, "speed/wps": 5512.90279386321, "speed/FLOPS": 243642085894268.0, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.24 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.24, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04287136718630791, "optim/lr": 2.2524879350006578e-05, "optim/total_tokens": 1951618039808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2974236011505127, "created_at": "2025-06-03T05:48:30.458747+00:00"} {"global_step": 232652, "acc_step": 0, "speed/wps": 5529.051883630869, "speed/FLOPS": 244355793003463.94, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043245647102594376, "optim/lr": 2.252133212491203e-05, "optim/total_tokens": 1951626428416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2733478546142578, "created_at": "2025-06-03T05:48:33.431657+00:00"} {"global_step": 232653, "acc_step": 0, "speed/wps": 5531.085265071839, "speed/FLOPS": 244445658055365.06, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04584250599145889, "optim/lr": 2.2517784899817485e-05, "optim/total_tokens": 1951634817024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2900309562683105, "created_at": "2025-06-03T05:48:36.399837+00:00"} {"global_step": 232654, "acc_step": 0, "speed/wps": 5514.210092249004, "speed/FLOPS": 243699861791560.38, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.91, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04271690547466278, "optim/lr": 2.251423767472294e-05, "optim/total_tokens": 1951643205632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2898321151733398, "created_at": "2025-06-03T05:48:39.378735+00:00"} {"global_step": 232655, "acc_step": 0, "speed/wps": 5529.057052069901, "speed/FLOPS": 244356021422014.66, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04267330467700958, "optim/lr": 2.2510690449628613e-05, "optim/total_tokens": 1951651594240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2857224941253662, "created_at": "2025-06-03T05:48:42.349885+00:00"} {"global_step": 232656, "acc_step": 0, "speed/wps": 5518.231197053699, "speed/FLOPS": 243877574042047.72, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046330709010362625, "optim/lr": 2.2507143224534066e-05, "optim/total_tokens": 1951659982848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2781126499176025, "created_at": "2025-06-03T05:48:45.323817+00:00"} {"global_step": 232657, "acc_step": 0, "speed/wps": 5521.145704805223, "speed/FLOPS": 244006380366862.06, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.050197500735521317, "optim/lr": 2.250359599943952e-05, "optim/total_tokens": 1951668371456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2967188358306885, "created_at": "2025-06-03T05:48:48.297541+00:00"} {"global_step": 232658, "acc_step": 0, "speed/wps": 5513.463473933736, "speed/FLOPS": 243666865083564.5, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04308366775512695, "optim/lr": 2.2500048774344973e-05, "optim/total_tokens": 1951676760064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2766038179397583, "created_at": "2025-06-03T05:48:51.277240+00:00"} {"global_step": 232659, "acc_step": 0, "speed/wps": 5521.221788346893, "speed/FLOPS": 244009742869973.0, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04343800991773605, "optim/lr": 2.2496501549250647e-05, "optim/total_tokens": 1951685148672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.292854905128479, "created_at": "2025-06-03T05:48:54.249550+00:00"} {"global_step": 232660, "acc_step": 0, "speed/wps": 5531.1767095671685, "speed/FLOPS": 244449699434003.28, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042973700910806656, "optim/lr": 2.24929543241561e-05, "optim/total_tokens": 1951693537280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2827686071395874, "created_at": "2025-06-03T05:48:57.216448+00:00"} {"global_step": 232661, "acc_step": 0, "speed/wps": 5535.935233122711, "speed/FLOPS": 244660001818826.75, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.22, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042456597089767456, "optim/lr": 2.2489407099061555e-05, "optim/total_tokens": 1951701925888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2961924076080322, "created_at": "2025-06-03T05:49:00.180860+00:00"} {"global_step": 232662, "acc_step": 0, "speed/wps": 5535.495090119109, "speed/FLOPS": 244640549750923.66, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04543242231011391, "optim/lr": 2.2485859873967008e-05, "optim/total_tokens": 1951710314496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2970762252807617, "created_at": "2025-06-03T05:49:03.145725+00:00"} {"global_step": 232663, "acc_step": 0, "speed/wps": 5533.483919226086, "speed/FLOPS": 244551666291557.88, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04467116296291351, "optim/lr": 2.2482312648872682e-05, "optim/total_tokens": 1951718703104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2756750583648682, "created_at": "2025-06-03T05:49:06.111007+00:00"} {"global_step": 232664, "acc_step": 0, "speed/wps": 5527.775510804082, "speed/FLOPS": 244299383857588.28, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04323147237300873, "optim/lr": 2.2478765423778136e-05, "optim/total_tokens": 1951727091712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2911064624786377, "created_at": "2025-06-03T05:49:09.079838+00:00"} {"global_step": 232665, "acc_step": 0, "speed/wps": 5526.848742024593, "speed/FLOPS": 244258425421167.5, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04522234573960304, "optim/lr": 2.247521819868359e-05, "optim/total_tokens": 1951735480320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2844657897949219, "created_at": "2025-06-03T05:49:12.048953+00:00"} {"global_step": 232666, "acc_step": 0, "speed/wps": 5523.638540254845, "speed/FLOPS": 244116550934246.84, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04281024634838104, "optim/lr": 2.2471670973589043e-05, "optim/total_tokens": 1951743868928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2874414920806885, "created_at": "2025-06-03T05:49:15.022307+00:00"} {"global_step": 232667, "acc_step": 0, "speed/wps": 5523.612210279133, "speed/FLOPS": 244115387284089.4, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043272338807582855, "optim/lr": 2.2468123748494717e-05, "optim/total_tokens": 1951752257536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2914302349090576, "created_at": "2025-06-03T05:49:17.993047+00:00"} {"global_step": 232668, "acc_step": 0, "speed/wps": 5513.15421555879, "speed/FLOPS": 243653197446319.75, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04323623701930046, "optim/lr": 2.246457652340017e-05, "optim/total_tokens": 1951760646144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3010224103927612, "created_at": "2025-06-03T05:49:20.969901+00:00"} {"global_step": 232669, "acc_step": 0, "speed/wps": 5511.474768973638, "speed/FLOPS": 243578974503442.88, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04335981234908104, "optim/lr": 2.2461029298305624e-05, "optim/total_tokens": 1951769034752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2934563159942627, "created_at": "2025-06-03T05:49:23.951431+00:00"} {"global_step": 232670, "acc_step": 0, "speed/wps": 5522.520180334307, "speed/FLOPS": 244067125150044.06, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042476680129766464, "optim/lr": 2.2457482073211077e-05, "optim/total_tokens": 1951777423360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2908083200454712, "created_at": "2025-06-03T05:49:26.926517+00:00"} {"global_step": 232671, "acc_step": 0, "speed/wps": 5527.172748168914, "speed/FLOPS": 244272744834332.72, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04384327679872513, "optim/lr": 2.245393484811675e-05, "optim/total_tokens": 1951785811968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2659969329833984, "created_at": "2025-06-03T05:49:29.901048+00:00"} {"global_step": 232672, "acc_step": 0, "speed/wps": 5508.831006958618, "speed/FLOPS": 243462133754379.72, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.23 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.23, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04287673532962799, "optim/lr": 2.2450387623022205e-05, "optim/total_tokens": 1951794200576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3049736022949219, "created_at": "2025-06-03T05:49:32.884902+00:00"} {"global_step": 232673, "acc_step": 0, "speed/wps": 5528.335499067941, "speed/FLOPS": 244324132472571.1, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046662379056215286, "optim/lr": 2.244684039792766e-05, "optim/total_tokens": 1951802589184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2863080501556396, "created_at": "2025-06-03T05:49:35.857860+00:00"} {"global_step": 232674, "acc_step": 0, "speed/wps": 5520.824358332354, "speed/FLOPS": 243992178497561.6, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04375047981739044, "optim/lr": 2.2443293172833112e-05, "optim/total_tokens": 1951810977792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2948122024536133, "created_at": "2025-06-03T05:49:38.830264+00:00"} {"global_step": 232675, "acc_step": 0, "speed/wps": 5521.259361956348, "speed/FLOPS": 244011403431191.72, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044580910354852676, "optim/lr": 2.243974594773879e-05, "optim/total_tokens": 1951819366400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.309403657913208, "created_at": "2025-06-03T05:49:41.806679+00:00"} {"global_step": 232676, "acc_step": 0, "speed/wps": 5511.580952883839, "speed/FLOPS": 243583667288775.25, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04268423840403557, "optim/lr": 2.243619872264424e-05, "optim/total_tokens": 1951827755008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2820497751235962, "created_at": "2025-06-03T05:49:44.785765+00:00"} {"global_step": 232677, "acc_step": 0, "speed/wps": 5520.645566624914, "speed/FLOPS": 243984276819231.66, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.71, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05370178073644638, "optim/lr": 2.2432651497549693e-05, "optim/total_tokens": 1951836143616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.293694257736206, "created_at": "2025-06-03T05:49:47.758583+00:00"} {"global_step": 232678, "acc_step": 0, "speed/wps": 5533.358657711677, "speed/FLOPS": 244546130373767.53, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.048102006316185, "optim/lr": 2.242910427245537e-05, "optim/total_tokens": 1951844532224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2884063720703125, "created_at": "2025-06-03T05:49:50.724453+00:00"} {"global_step": 232679, "acc_step": 0, "speed/wps": 5526.3160627114175, "speed/FLOPS": 244234883722025.03, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04737503454089165, "optim/lr": 2.2425557047360824e-05, "optim/total_tokens": 1951852920832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2826123237609863, "created_at": "2025-06-03T05:49:53.693955+00:00"} {"global_step": 232680, "acc_step": 0, "speed/wps": 5528.26550681663, "speed/FLOPS": 244321039173315.94, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04883942753076553, "optim/lr": 2.2422009822266278e-05, "optim/total_tokens": 1951861309440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.290951132774353, "created_at": "2025-06-03T05:49:56.662135+00:00"} {"global_step": 232681, "acc_step": 0, "speed/wps": 5526.337036367216, "speed/FLOPS": 244235810650258.4, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04276270419359207, "optim/lr": 2.2418462597171728e-05, "optim/total_tokens": 1951869698048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2714533805847168, "created_at": "2025-06-03T05:49:59.631541+00:00"} {"global_step": 232682, "acc_step": 0, "speed/wps": 5526.32774997351, "speed/FLOPS": 244235400239188.72, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.57, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0463540144264698, "optim/lr": 2.2414915372077405e-05, "optim/total_tokens": 1951878086656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.290073275566101, "created_at": "2025-06-03T05:50:02.603065+00:00"} {"global_step": 232683, "acc_step": 0, "speed/wps": 5509.658672935173, "speed/FLOPS": 243498712354164.94, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.22 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.22, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044164299964904785, "optim/lr": 2.241136814698286e-05, "optim/total_tokens": 1951886475264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2839024066925049, "created_at": "2025-06-03T05:50:05.585398+00:00"} {"global_step": 232684, "acc_step": 0, "speed/wps": 5516.806620686989, "speed/FLOPS": 243814615058281.97, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.049225322902202606, "optim/lr": 2.2407820921888312e-05, "optim/total_tokens": 1951894863872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2848231792449951, "created_at": "2025-06-03T05:50:08.560754+00:00"} {"global_step": 232685, "acc_step": 0, "speed/wps": 5524.5259586964985, "speed/FLOPS": 244155770287148.6, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04261593893170357, "optim/lr": 2.2404273696793766e-05, "optim/total_tokens": 1951903252480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2819139957427979, "created_at": "2025-06-03T05:50:11.531889+00:00"} {"global_step": 232686, "acc_step": 0, "speed/wps": 5529.81658573514, "speed/FLOPS": 244389588922372.47, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04430709034204483, "optim/lr": 2.240072647169944e-05, "optim/total_tokens": 1951911641088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2870486974716187, "created_at": "2025-06-03T05:50:14.499573+00:00"} {"global_step": 232687, "acc_step": 0, "speed/wps": 5525.710759287073, "speed/FLOPS": 244208132408892.8, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04333614557981491, "optim/lr": 2.2397179246604893e-05, "optim/total_tokens": 1951920029696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2994639873504639, "created_at": "2025-06-03T05:50:17.469234+00:00"} {"global_step": 232688, "acc_step": 0, "speed/wps": 5519.175650379261, "speed/FLOPS": 243919314044887.22, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045799240469932556, "optim/lr": 2.2393632021510347e-05, "optim/total_tokens": 1951928418304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2896652221679688, "created_at": "2025-06-03T05:50:20.447162+00:00"} {"global_step": 232689, "acc_step": 0, "speed/wps": 5530.189501605343, "speed/FLOPS": 244406069895079.03, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.44, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045145031064748764, "optim/lr": 2.23900847964158e-05, "optim/total_tokens": 1951936806912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.3047025203704834, "created_at": "2025-06-03T05:50:23.414666+00:00"} {"global_step": 232690, "acc_step": 0, "speed/wps": 5529.55802293219, "speed/FLOPS": 244378161769926.53, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0427434928715229, "optim/lr": 2.2386537571321474e-05, "optim/total_tokens": 1951945195520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.27768075466156, "created_at": "2025-06-03T05:50:26.382082+00:00"} {"global_step": 232691, "acc_step": 0, "speed/wps": 5510.771124079862, "speed/FLOPS": 243547877000719.03, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.21 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.21, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04374358803033829, "optim/lr": 2.2382990346226928e-05, "optim/total_tokens": 1951953584128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2847793102264404, "created_at": "2025-06-03T05:50:29.363537+00:00"} {"global_step": 232692, "acc_step": 0, "speed/wps": 5518.297010032091, "speed/FLOPS": 243880482638831.25, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044615842401981354, "optim/lr": 2.237944312113238e-05, "optim/total_tokens": 1951961972736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2920349836349487, "created_at": "2025-06-03T05:50:32.337046+00:00"} {"global_step": 232693, "acc_step": 0, "speed/wps": 5519.117351433385, "speed/FLOPS": 243916737529880.53, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04643460735678673, "optim/lr": 2.2375895896037835e-05, "optim/total_tokens": 1951970361344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2929537296295166, "created_at": "2025-06-03T05:50:35.310208+00:00"} {"global_step": 232694, "acc_step": 0, "speed/wps": 5528.353837820704, "speed/FLOPS": 244324942951576.97, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04260906204581261, "optim/lr": 2.237234867094351e-05, "optim/total_tokens": 1951978749952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.289538860321045, "created_at": "2025-06-03T05:50:38.282262+00:00"} {"global_step": 232695, "acc_step": 0, "speed/wps": 5536.176201792932, "speed/FLOPS": 244670651400661.06, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.24, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045236267149448395, "optim/lr": 2.2368801445848963e-05, "optim/total_tokens": 1951987138560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2879961729049683, "created_at": "2025-06-03T05:50:41.249060+00:00"} {"global_step": 232696, "acc_step": 0, "speed/wps": 5530.833449444972, "speed/FLOPS": 244434529093566.78, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.42, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.0426880419254303, "optim/lr": 2.2365254220754416e-05, "optim/total_tokens": 1951995527168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.296189785003662, "created_at": "2025-06-03T05:50:44.215906+00:00"} {"global_step": 232697, "acc_step": 0, "speed/wps": 5523.479466400521, "speed/FLOPS": 244109520684099.53, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04738886281847954, "optim/lr": 2.236170699565987e-05, "optim/total_tokens": 1952003915776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2915984392166138, "created_at": "2025-06-03T05:50:47.186861+00:00"} {"global_step": 232698, "acc_step": 0, "speed/wps": 5524.877523909315, "speed/FLOPS": 244171307670081.2, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04274367168545723, "optim/lr": 2.2358159770565544e-05, "optim/total_tokens": 1952012304384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.296802043914795, "created_at": "2025-06-03T05:50:50.161393+00:00"} {"global_step": 232699, "acc_step": 0, "speed/wps": 5529.67048499009, "speed/FLOPS": 244383132017252.7, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04251299053430557, "optim/lr": 2.2354612545470997e-05, "optim/total_tokens": 1952020692992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.3077841997146606, "created_at": "2025-06-03T05:50:53.128872+00:00"} {"global_step": 232700, "acc_step": 0, "speed/wps": 5523.0334278605405, "speed/FLOPS": 244089808063664.6, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043604642152786255, "optim/lr": 2.235106532037645e-05, "optim/total_tokens": 1952029081600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2975409030914307, "created_at": "2025-06-03T05:50:56.100333+00:00"} {"global_step": 232701, "acc_step": 0, "speed/wps": 5521.695779026407, "speed/FLOPS": 244030690831903.28, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04312066733837128, "optim/lr": 2.2347518095281904e-05, "optim/total_tokens": 1952037470208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.286500334739685, "created_at": "2025-06-03T05:50:59.076119+00:00"} {"global_step": 232702, "acc_step": 0, "speed/wps": 5524.322922808548, "speed/FLOPS": 244146797140133.06, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.66, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04335977882146835, "optim/lr": 2.2343970870187578e-05, "optim/total_tokens": 1952045858816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2848492860794067, "created_at": "2025-06-03T05:51:02.046656+00:00"} {"global_step": 232703, "acc_step": 0, "speed/wps": 5527.310532628578, "speed/FLOPS": 244278834202205.06, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04293635115027428, "optim/lr": 2.2340423645093032e-05, "optim/total_tokens": 1952054247424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2913379669189453, "created_at": "2025-06-03T05:51:05.020342+00:00"} {"global_step": 232704, "acc_step": 0, "speed/wps": 5517.0892823354125, "speed/FLOPS": 243827107256348.8, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042733319103717804, "optim/lr": 2.2336876419998485e-05, "optim/total_tokens": 1952062636032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.286374568939209, "created_at": "2025-06-03T05:51:07.996612+00:00"} {"global_step": 232705, "acc_step": 0, "speed/wps": 5525.973177777937, "speed/FLOPS": 244219729963009.4, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045362040400505066, "optim/lr": 2.2333329194904163e-05, "optim/total_tokens": 1952071024640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.286798357963562, "created_at": "2025-06-03T05:51:10.970358+00:00"} {"global_step": 232706, "acc_step": 0, "speed/wps": 5528.466584908423, "speed/FLOPS": 244329925795762.25, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04340827092528343, "optim/lr": 2.2329781969809616e-05, "optim/total_tokens": 1952079413248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2846651077270508, "created_at": "2025-06-03T05:51:13.938276+00:00"} {"global_step": 232707, "acc_step": 0, "speed/wps": 5532.0604067866025, "speed/FLOPS": 244488754327929.88, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.17 hours", "speed/est_time_elapsed_hrs": 191.33, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.17, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.048112280666828156, "optim/lr": 2.2326234744715067e-05, "optim/total_tokens": 1952087801856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.3012661933898926, "created_at": "2025-06-03T05:51:16.904481+00:00"} {"global_step": 232708, "acc_step": 0, "speed/wps": 5529.589364407253, "speed/FLOPS": 244379546902704.1, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.046056415885686874, "optim/lr": 2.232268751962052e-05, "optim/total_tokens": 1952096190464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.3060309886932373, "created_at": "2025-06-03T05:51:19.875121+00:00"} {"global_step": 232709, "acc_step": 0, "speed/wps": 5503.1778615805515, "speed/FLOPS": 243212293664090.28, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045622821897268295, "optim/lr": 2.2319140294526197e-05, "optim/total_tokens": 1952104579072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2801830768585205, "created_at": "2025-06-03T05:51:22.856774+00:00"} {"global_step": 232710, "acc_step": 0, "speed/wps": 5506.9205207124005, "speed/FLOPS": 243377700041051.97, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042854443192481995, "optim/lr": 2.231559306943165e-05, "optim/total_tokens": 1952112967680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.28805673122406, "created_at": "2025-06-03T05:51:25.838878+00:00"} {"global_step": 232711, "acc_step": 0, "speed/wps": 5540.434272429053, "speed/FLOPS": 244858836327996.34, "speed/curr_iter_time": 2.9556, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9556, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.06, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.051920175552368164, "optim/lr": 2.2312045844337105e-05, "optim/total_tokens": 1952121356288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2853269577026367, "created_at": "2025-06-03T05:51:28.805900+00:00"} {"global_step": 232712, "acc_step": 0, "speed/wps": 5526.6498550766655, "speed/FLOPS": 244249635636064.8, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04371481016278267, "optim/lr": 2.2308498619242558e-05, "optim/total_tokens": 1952129744896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2834577560424805, "created_at": "2025-06-03T05:51:31.775707+00:00"} {"global_step": 232713, "acc_step": 0, "speed/wps": 5529.423843895988, "speed/FLOPS": 244372231743316.97, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.17 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.17, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.050124626606702805, "optim/lr": 2.2304951394148232e-05, "optim/total_tokens": 1952138133504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2951328754425049, "created_at": "2025-06-03T05:51:34.747084+00:00"} {"global_step": 232714, "acc_step": 0, "speed/wps": 5512.898293493079, "speed/FLOPS": 243641887000943.2, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05304820090532303, "optim/lr": 2.2301404169053686e-05, "optim/total_tokens": 1952146522112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2827823162078857, "created_at": "2025-06-03T05:51:37.723593+00:00"} {"global_step": 232715, "acc_step": 0, "speed/wps": 5516.922489839293, "speed/FLOPS": 243819735881741.72, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05114256218075752, "optim/lr": 2.229785694395914e-05, "optim/total_tokens": 1952154910720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2903422117233276, "created_at": "2025-06-03T05:51:40.697728+00:00"} {"global_step": 232716, "acc_step": 0, "speed/wps": 5519.47807249611, "speed/FLOPS": 243932679554515.22, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045189548283815384, "optim/lr": 2.2294309718864593e-05, "optim/total_tokens": 1952163299328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2909780740737915, "created_at": "2025-06-03T05:51:43.673561+00:00"} {"global_step": 232717, "acc_step": 0, "speed/wps": 5519.494976675939, "speed/FLOPS": 243933426632740.22, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.18 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.18, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04681052267551422, "optim/lr": 2.2290762493770267e-05, "optim/total_tokens": 1952171687936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3011138439178467, "created_at": "2025-06-03T05:51:46.648690+00:00"} {"global_step": 232718, "acc_step": 0, "speed/wps": 5498.223231453193, "speed/FLOPS": 242993324372556.97, "speed/curr_iter_time": 2.978, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.978, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.2 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.2, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043161820620298386, "optim/lr": 2.228721526867572e-05, "optim/total_tokens": 1952180076544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2908211946487427, "created_at": "2025-06-03T05:51:49.635822+00:00"} {"global_step": 232719, "acc_step": 0, "speed/wps": 5538.905314540833, "speed/FLOPS": 244791264215252.94, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.17, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0484173409640789, "optim/lr": 2.2283668043581174e-05, "optim/total_tokens": 1952188465152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.3050509691238403, "created_at": "2025-06-03T05:51:52.599989+00:00"} {"global_step": 232720, "acc_step": 0, "speed/wps": 5534.852702405818, "speed/FLOPS": 244612159502034.56, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04482971131801605, "optim/lr": 2.2280120818486627e-05, "optim/total_tokens": 1952196853760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2743148803710938, "created_at": "2025-06-03T05:51:55.565394+00:00"} {"global_step": 232721, "acc_step": 0, "speed/wps": 5534.172302821551, "speed/FLOPS": 244582089323010.78, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.043299149721860886, "optim/lr": 2.22765735933923e-05, "optim/total_tokens": 1952205242368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2894126176834106, "created_at": "2025-06-03T05:51:58.530511+00:00"} {"global_step": 232722, "acc_step": 0, "speed/wps": 5532.307578042568, "speed/FLOPS": 244499678032306.38, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.39, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04269967973232269, "optim/lr": 2.2273026368297755e-05, "optim/total_tokens": 1952213630976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.308574914932251, "created_at": "2025-06-03T05:52:01.496682+00:00"} {"global_step": 232723, "acc_step": 0, "speed/wps": 5521.73617585787, "speed/FLOPS": 244032476165084.22, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.17 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.17, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04251941293478012, "optim/lr": 2.226947914320321e-05, "optim/total_tokens": 1952222019584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2768566608428955, "created_at": "2025-06-03T05:52:04.469826+00:00"} {"global_step": 232724, "acc_step": 0, "speed/wps": 5528.462048233453, "speed/FLOPS": 244329725297949.38, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04283059015870094, "optim/lr": 2.2265931918108662e-05, "optim/total_tokens": 1952230408192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2962123155593872, "created_at": "2025-06-03T05:52:07.437966+00:00"} {"global_step": 232725, "acc_step": 0, "speed/wps": 5517.764219904261, "speed/FLOPS": 243856936042248.28, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.17 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.17, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04241163656115532, "optim/lr": 2.2262384693014336e-05, "optim/total_tokens": 1952238796800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2916983366012573, "created_at": "2025-06-03T05:52:10.413773+00:00"} {"global_step": 232726, "acc_step": 0, "speed/wps": 5521.452652715845, "speed/FLOPS": 244019945893409.72, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.17 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.17, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04424535110592842, "optim/lr": 2.225883746791979e-05, "optim/total_tokens": 1952247185408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2840114831924438, "created_at": "2025-06-03T05:52:13.386245+00:00"} {"global_step": 232727, "acc_step": 0, "speed/wps": 5517.7828580831465, "speed/FLOPS": 243857759754356.16, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.17 hours", "speed/est_time_elapsed_hrs": 191.91, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.17, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.042914293706417084, "optim/lr": 2.2255290242825243e-05, "optim/total_tokens": 1952255574016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2936781644821167, "created_at": "2025-06-03T05:52:16.361779+00:00"} {"global_step": 232728, "acc_step": 0, "speed/wps": 5526.806929915748, "speed/FLOPS": 244256577539970.3, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04349767044186592, "optim/lr": 2.2251743017730697e-05, "optim/total_tokens": 1952263962624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2889912128448486, "created_at": "2025-06-03T05:52:19.333960+00:00"} {"global_step": 232729, "acc_step": 0, "speed/wps": 5529.7834722095595, "speed/FLOPS": 244388125474032.22, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044509220868349075, "optim/lr": 2.224819579263637e-05, "optim/total_tokens": 1952272351232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2991936206817627, "created_at": "2025-06-03T05:52:22.305441+00:00"} {"global_step": 232730, "acc_step": 0, "speed/wps": 5528.580509794807, "speed/FLOPS": 244334960692619.97, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04413117840886116, "optim/lr": 2.2244648567541824e-05, "optim/total_tokens": 1952280739840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2720271348953247, "created_at": "2025-06-03T05:52:25.273862+00:00"} {"global_step": 232731, "acc_step": 0, "speed/wps": 5526.908466334283, "speed/FLOPS": 244261064929959.06, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044808901846408844, "optim/lr": 2.2241101342447278e-05, "optim/total_tokens": 1952289128448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2745755910873413, "created_at": "2025-06-03T05:52:28.243523+00:00"} {"global_step": 232732, "acc_step": 0, "speed/wps": 5528.118182558647, "speed/FLOPS": 244314528195187.03, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045955590903759, "optim/lr": 2.2237554117352955e-05, "optim/total_tokens": 1952297517056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2995405197143555, "created_at": "2025-06-03T05:52:31.211436+00:00"} {"global_step": 232733, "acc_step": 0, "speed/wps": 5520.836024543543, "speed/FLOPS": 243992694084383.1, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.044831372797489166, "optim/lr": 2.223400689225841e-05, "optim/total_tokens": 1952305905664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.282171607017517, "created_at": "2025-06-03T05:52:34.183617+00:00"} {"global_step": 232734, "acc_step": 0, "speed/wps": 5529.439813628531, "speed/FLOPS": 244372937523754.84, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 191.46, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045756857842206955, "optim/lr": 2.223045966716386e-05, "optim/total_tokens": 1952314294272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3001518249511719, "created_at": "2025-06-03T05:52:37.152232+00:00"} {"global_step": 232735, "acc_step": 0, "speed/wps": 5523.048182912296, "speed/FLOPS": 244090460161429.0, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.045346420258283615, "optim/lr": 2.2226912442069312e-05, "optim/total_tokens": 1952322682880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2904843091964722, "created_at": "2025-06-03T05:52:40.127652+00:00"} {"global_step": 232736, "acc_step": 0, "speed/wps": 5531.140092103899, "speed/FLOPS": 244448081129551.97, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04656211659312248, "optim/lr": 2.222336521697499e-05, "optim/total_tokens": 1952331071488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.299857497215271, "created_at": "2025-06-03T05:52:43.099257+00:00"} {"global_step": 232737, "acc_step": 0, "speed/wps": 5526.992103807701, "speed/FLOPS": 244264761278188.75, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04746706038713455, "optim/lr": 2.2219817991880443e-05, "optim/total_tokens": 1952339460096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2953897714614868, "created_at": "2025-06-03T05:52:46.069003+00:00"} {"global_step": 232738, "acc_step": 0, "speed/wps": 5524.892811085046, "speed/FLOPS": 244171983285001.62, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.053497061133384705, "optim/lr": 2.2216270766785897e-05, "optim/total_tokens": 1952347848704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2812896966934204, "created_at": "2025-06-03T05:52:49.042631+00:00"} {"global_step": 232739, "acc_step": 0, "speed/wps": 5522.434064790977, "speed/FLOPS": 244063319283808.16, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04325796291232109, "optim/lr": 2.2212723541691347e-05, "optim/total_tokens": 1952356237312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2813674211502075, "created_at": "2025-06-03T05:52:52.013846+00:00"} {"global_step": 232740, "acc_step": 0, "speed/wps": 5514.00309611369, "speed/FLOPS": 243690713621881.75, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.17 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.17, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.055013712495565414, "optim/lr": 2.2209176316597024e-05, "optim/total_tokens": 1952364625920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2771828174591064, "created_at": "2025-06-03T05:52:54.990009+00:00"} {"global_step": 232741, "acc_step": 0, "speed/wps": 5525.063738939679, "speed/FLOPS": 244179537421288.34, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04343659430742264, "optim/lr": 2.2205629091502478e-05, "optim/total_tokens": 1952373014528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2957978248596191, "created_at": "2025-06-03T05:52:57.960159+00:00"} {"global_step": 232742, "acc_step": 0, "speed/wps": 5522.764639019001, "speed/FLOPS": 244077928972654.56, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.048570338636636734, "optim/lr": 2.220208186640793e-05, "optim/total_tokens": 1952381403136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2850141525268555, "created_at": "2025-06-03T05:53:00.931569+00:00"} {"global_step": 232743, "acc_step": 0, "speed/wps": 5521.618429420033, "speed/FLOPS": 244027272375212.72, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04433371126651764, "optim/lr": 2.2198534641313385e-05, "optim/total_tokens": 1952389791744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.282926082611084, "created_at": "2025-06-03T05:53:03.903741+00:00"} {"global_step": 232744, "acc_step": 0, "speed/wps": 5521.490757159138, "speed/FLOPS": 244021629914767.06, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.046026021242141724, "optim/lr": 2.219498741621906e-05, "optim/total_tokens": 1952398180352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2936179637908936, "created_at": "2025-06-03T05:53:06.876345+00:00"} {"global_step": 232745, "acc_step": 0, "speed/wps": 5515.420998795315, "speed/FLOPS": 243753377662925.75, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04327818751335144, "optim/lr": 2.2191440191124513e-05, "optim/total_tokens": 1952406568960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.307751178741455, "created_at": "2025-06-03T05:53:09.851488+00:00"} {"global_step": 232746, "acc_step": 0, "speed/wps": 5518.761607288515, "speed/FLOPS": 243901015459540.88, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.054021820425987244, "optim/lr": 2.2187892966029966e-05, "optim/total_tokens": 1952414957568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.290047287940979, "created_at": "2025-06-03T05:53:12.827808+00:00"} {"global_step": 232747, "acc_step": 0, "speed/wps": 5522.8505000298155, "speed/FLOPS": 244081723589856.06, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04356703162193298, "optim/lr": 2.218434574093542e-05, "optim/total_tokens": 1952423346176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2855533361434937, "created_at": "2025-06-03T05:53:15.800789+00:00"} {"global_step": 232748, "acc_step": 0, "speed/wps": 5526.785487798055, "speed/FLOPS": 244255629908119.03, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 191.56, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.058186981827020645, "optim/lr": 2.2180798515841094e-05, "optim/total_tokens": 1952431734784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2871673107147217, "created_at": "2025-06-03T05:53:18.769561+00:00"} {"global_step": 232749, "acc_step": 0, "speed/wps": 5512.860817615604, "speed/FLOPS": 243640230758977.72, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04436151683330536, "optim/lr": 2.2177251290746547e-05, "optim/total_tokens": 1952440123392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2851214408874512, "created_at": "2025-06-03T05:53:21.746807+00:00"} {"global_step": 232750, "acc_step": 0, "speed/wps": 5522.412714230974, "speed/FLOPS": 244062375698338.12, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04791175201535225, "optim/lr": 2.2173704065652e-05, "optim/total_tokens": 1952448512000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2813652753829956, "created_at": "2025-06-03T05:53:24.717572+00:00"} {"global_step": 232751, "acc_step": 0, "speed/wps": 5526.192139717583, "speed/FLOPS": 244229406959992.94, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04248754680156708, "optim/lr": 2.2170156840557454e-05, "optim/total_tokens": 1952456900608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.27967369556427, "created_at": "2025-06-03T05:53:27.691873+00:00"} {"global_step": 232752, "acc_step": 0, "speed/wps": 5507.519037380732, "speed/FLOPS": 243404151414306.2, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.16 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.16, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.04209895804524422, "optim/lr": 2.216660961546313e-05, "optim/total_tokens": 1952465289216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2871216535568237, "created_at": "2025-06-03T05:53:30.672018+00:00"} {"global_step": 232753, "acc_step": 0, "speed/wps": 5516.626136888095, "speed/FLOPS": 243806638598170.7, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04621897265315056, "optim/lr": 2.2163062390368582e-05, "optim/total_tokens": 1952473677824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2980687618255615, "created_at": "2025-06-03T05:53:33.646154+00:00"} {"global_step": 232754, "acc_step": 0, "speed/wps": 5540.147227759831, "speed/FLOPS": 244846150422844.56, "speed/curr_iter_time": 2.9566, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9566, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.16, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04431480914354324, "optim/lr": 2.2159515165274036e-05, "optim/total_tokens": 1952482066432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2784786224365234, "created_at": "2025-06-03T05:53:36.607670+00:00"} {"global_step": 232755, "acc_step": 0, "speed/wps": 5527.241897423572, "speed/FLOPS": 244275800877450.6, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04447761923074722, "optim/lr": 2.215596794017949e-05, "optim/total_tokens": 1952490455040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2885969877243042, "created_at": "2025-06-03T05:53:39.576858+00:00"} {"global_step": 232756, "acc_step": 0, "speed/wps": 5532.182803398647, "speed/FLOPS": 244494163631699.56, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04487503692507744, "optim/lr": 2.2152420715085163e-05, "optim/total_tokens": 1952498843648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2930023670196533, "created_at": "2025-06-03T05:53:42.543816+00:00"} {"global_step": 232757, "acc_step": 0, "speed/wps": 5530.327890270616, "speed/FLOPS": 244412185965746.7, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.49, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04425573721528053, "optim/lr": 2.2148873489990617e-05, "optim/total_tokens": 1952507232256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2846927642822266, "created_at": "2025-06-03T05:53:45.514924+00:00"} {"global_step": 232758, "acc_step": 0, "speed/wps": 5520.247927250233, "speed/FLOPS": 243966703194173.6, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042683109641075134, "optim/lr": 2.214532626489607e-05, "optim/total_tokens": 1952515620864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.284568428993225, "created_at": "2025-06-03T05:53:48.489649+00:00"} {"global_step": 232759, "acc_step": 0, "speed/wps": 5509.143702381395, "speed/FLOPS": 243475953291546.2, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04301190748810768, "optim/lr": 2.2141779039801747e-05, "optim/total_tokens": 1952524009472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2821471691131592, "created_at": "2025-06-03T05:53:51.471125+00:00"} {"global_step": 232760, "acc_step": 0, "speed/wps": 5515.41679907847, "speed/FLOPS": 243753192056937.28, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04279569163918495, "optim/lr": 2.2138231814707198e-05, "optim/total_tokens": 1952532398080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2865362167358398, "created_at": "2025-06-03T05:53:54.445950+00:00"} {"global_step": 232761, "acc_step": 0, "speed/wps": 5507.152480505931, "speed/FLOPS": 243387951476648.16, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04352419823408127, "optim/lr": 2.213468458961265e-05, "optim/total_tokens": 1952540786688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.30062997341156, "created_at": "2025-06-03T05:53:57.425110+00:00"} {"global_step": 232762, "acc_step": 0, "speed/wps": 5511.232654551804, "speed/FLOPS": 243568274285251.8, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.15 hours", "speed/est_time_elapsed_hrs": 192.16, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.15, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04504796862602234, "optim/lr": 2.2131137364518105e-05, "optim/total_tokens": 1952549175296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2953832149505615, "created_at": "2025-06-03T05:54:00.401779+00:00"} {"global_step": 232763, "acc_step": 0, "speed/wps": 5528.827777209052, "speed/FLOPS": 244345888646700.28, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.45, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04333885759115219, "optim/lr": 2.2127590139423782e-05, "optim/total_tokens": 1952557563904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.297824501991272, "created_at": "2025-06-03T05:54:03.368702+00:00"} {"global_step": 232764, "acc_step": 0, "speed/wps": 5520.468211343047, "speed/FLOPS": 243976438623559.78, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0024, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04307355359196663, "optim/lr": 2.2124042914329236e-05, "optim/total_tokens": 1952565952512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2854149341583252, "created_at": "2025-06-03T05:54:06.340593+00:00"} {"global_step": 232765, "acc_step": 0, "speed/wps": 5519.906113569991, "speed/FLOPS": 243951596779067.94, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04328668490052223, "optim/lr": 2.212049568923469e-05, "optim/total_tokens": 1952574341120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2942699193954468, "created_at": "2025-06-03T05:54:09.316016+00:00"} {"global_step": 232766, "acc_step": 0, "speed/wps": 5523.575003525208, "speed/FLOPS": 244113742936007.34, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.62, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04470966011285782, "optim/lr": 2.211694846414014e-05, "optim/total_tokens": 1952582729728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.3005009889602661, "created_at": "2025-06-03T05:54:12.285917+00:00"} {"global_step": 232767, "acc_step": 0, "speed/wps": 5519.523716530309, "speed/FLOPS": 243934696787199.44, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04254031926393509, "optim/lr": 2.2113401239045817e-05, "optim/total_tokens": 1952591118336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2922279834747314, "created_at": "2025-06-03T05:54:15.258055+00:00"} {"global_step": 232768, "acc_step": 0, "speed/wps": 5514.068509710005, "speed/FLOPS": 243693604568021.72, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04234769195318222, "optim/lr": 2.210985401395127e-05, "optim/total_tokens": 1952599506944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2850292921066284, "created_at": "2025-06-03T05:54:18.233942+00:00"} {"global_step": 232769, "acc_step": 0, "speed/wps": 5520.685237777522, "speed/FLOPS": 243986030081121.6, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.048097580671310425, "optim/lr": 2.2106306788856724e-05, "optim/total_tokens": 1952607895552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2918850183486938, "created_at": "2025-06-03T05:54:21.205709+00:00"} {"global_step": 232770, "acc_step": 0, "speed/wps": 5526.075939889794, "speed/FLOPS": 244224271522369.3, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04268965125083923, "optim/lr": 2.2102759563762178e-05, "optim/total_tokens": 1952616284160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.271270513534546, "created_at": "2025-06-03T05:54:24.176376+00:00"} {"global_step": 232771, "acc_step": 0, "speed/wps": 5518.680053377385, "speed/FLOPS": 243897411194099.7, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05364658311009407, "optim/lr": 2.209921233866785e-05, "optim/total_tokens": 1952624672768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.289473056793213, "created_at": "2025-06-03T05:54:27.152955+00:00"} {"global_step": 232772, "acc_step": 0, "speed/wps": 5510.111446106548, "speed/FLOPS": 243518722610836.53, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04441426321864128, "optim/lr": 2.2095665113573305e-05, "optim/total_tokens": 1952633061376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.293066143989563, "created_at": "2025-06-03T05:54:30.132731+00:00"} {"global_step": 232773, "acc_step": 0, "speed/wps": 5520.340819625804, "speed/FLOPS": 243970808561707.56, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.049759384244680405, "optim/lr": 2.209211788847876e-05, "optim/total_tokens": 1952641449984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3009936809539795, "created_at": "2025-06-03T05:54:33.104533+00:00"} {"global_step": 232774, "acc_step": 0, "speed/wps": 5521.801283440511, "speed/FLOPS": 244035353586986.12, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04271949082612991, "optim/lr": 2.2088570663384212e-05, "optim/total_tokens": 1952649838592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2939938306808472, "created_at": "2025-06-03T05:54:36.075196+00:00"} {"global_step": 232775, "acc_step": 0, "speed/wps": 5518.388608161046, "speed/FLOPS": 243884530807289.38, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04860500246286392, "optim/lr": 2.2085023438289886e-05, "optim/total_tokens": 1952658227200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2942490577697754, "created_at": "2025-06-03T05:54:39.051202+00:00"} {"global_step": 232776, "acc_step": 0, "speed/wps": 5516.826027027153, "speed/FLOPS": 243815472719186.56, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04277457669377327, "optim/lr": 2.208147621319534e-05, "optim/total_tokens": 1952666615808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2944586277008057, "created_at": "2025-06-03T05:54:42.024550+00:00"} {"global_step": 232777, "acc_step": 0, "speed/wps": 5504.035349599807, "speed/FLOPS": 243250190245519.8, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.14 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.14, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04666709899902344, "optim/lr": 2.2077928988100793e-05, "optim/total_tokens": 1952675004416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.290906548500061, "created_at": "2025-06-03T05:54:45.005067+00:00"} {"global_step": 232778, "acc_step": 0, "speed/wps": 5487.306182019256, "speed/FLOPS": 242510846666101.47, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045207809656858444, "optim/lr": 2.2074381763006247e-05, "optim/total_tokens": 1952683393024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2913755178451538, "created_at": "2025-06-03T05:54:47.993867+00:00"} {"global_step": 232779, "acc_step": 0, "speed/wps": 5529.640871132507, "speed/FLOPS": 244381823236324.97, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04247593879699707, "optim/lr": 2.207083453791192e-05, "optim/total_tokens": 1952691781632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.293375849723816, "created_at": "2025-06-03T05:54:50.964421+00:00"} {"global_step": 232780, "acc_step": 0, "speed/wps": 5531.985166700271, "speed/FLOPS": 244485429101227.7, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043990910053253174, "optim/lr": 2.2067287312817374e-05, "optim/total_tokens": 1952700170240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2880444526672363, "created_at": "2025-06-03T05:54:53.929989+00:00"} {"global_step": 232781, "acc_step": 0, "speed/wps": 5515.081023992203, "speed/FLOPS": 243738352516776.97, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04577842354774475, "optim/lr": 2.2063740087722828e-05, "optim/total_tokens": 1952708558848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2823152542114258, "created_at": "2025-06-03T05:54:56.904377+00:00"} {"global_step": 232782, "acc_step": 0, "speed/wps": 5521.888171767788, "speed/FLOPS": 244039193606317.0, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0447714626789093, "optim/lr": 2.206019286262828e-05, "optim/total_tokens": 1952716947456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.292610764503479, "created_at": "2025-06-03T05:54:59.874522+00:00"} {"global_step": 232783, "acc_step": 0, "speed/wps": 5529.344126091269, "speed/FLOPS": 244368708624381.06, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.047807008028030396, "optim/lr": 2.2056645637533955e-05, "optim/total_tokens": 1952725336064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2839940786361694, "created_at": "2025-06-03T05:55:02.844599+00:00"} {"global_step": 232784, "acc_step": 0, "speed/wps": 5515.311720051774, "speed/FLOPS": 243748548101800.53, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04900667816400528, "optim/lr": 2.205309841243941e-05, "optim/total_tokens": 1952733724672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2825971841812134, "created_at": "2025-06-03T05:55:05.818396+00:00"} {"global_step": 232785, "acc_step": 0, "speed/wps": 5508.927628988536, "speed/FLOPS": 243466403953545.7, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04807925224304199, "optim/lr": 2.2049551187344863e-05, "optim/total_tokens": 1952742113280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2701473236083984, "created_at": "2025-06-03T05:55:08.796026+00:00"} {"global_step": 232786, "acc_step": 0, "speed/wps": 5522.075748381138, "speed/FLOPS": 244047483532522.9, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04909684509038925, "optim/lr": 2.204600396225054e-05, "optim/total_tokens": 1952750501888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.28804612159729, "created_at": "2025-06-03T05:55:11.766722+00:00"} {"global_step": 232787, "acc_step": 0, "speed/wps": 5524.298184436691, "speed/FLOPS": 244145703830719.47, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04685453698039055, "optim/lr": 2.204245673715599e-05, "optim/total_tokens": 1952758890496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.294479250907898, "created_at": "2025-06-03T05:55:14.736000+00:00"} {"global_step": 232788, "acc_step": 0, "speed/wps": 5516.715045225801, "speed/FLOPS": 243810567891623.16, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04406479373574257, "optim/lr": 2.2038909512061444e-05, "optim/total_tokens": 1952767279104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2869303226470947, "created_at": "2025-06-03T05:55:17.711637+00:00"} {"global_step": 232789, "acc_step": 0, "speed/wps": 5505.2394958952855, "speed/FLOPS": 243303407348400.5, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.052851203829050064, "optim/lr": 2.2035362286966897e-05, "optim/total_tokens": 1952775667712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2862532138824463, "created_at": "2025-06-03T05:55:20.691010+00:00"} {"global_step": 232790, "acc_step": 0, "speed/wps": 5514.295864208487, "speed/FLOPS": 243703652473148.8, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04635246843099594, "optim/lr": 2.2031815061872574e-05, "optim/total_tokens": 1952784056320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.293031096458435, "created_at": "2025-06-03T05:55:23.668117+00:00"} {"global_step": 232791, "acc_step": 0, "speed/wps": 5521.543722654357, "speed/FLOPS": 244023970718553.75, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04983210936188698, "optim/lr": 2.2028267836778028e-05, "optim/total_tokens": 1952792444928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2905761003494263, "created_at": "2025-06-03T05:55:26.639454+00:00"} {"global_step": 232792, "acc_step": 0, "speed/wps": 5506.471371597694, "speed/FLOPS": 243357849949135.53, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042610831558704376, "optim/lr": 2.2024720611683478e-05, "optim/total_tokens": 1952800833536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2759966850280762, "created_at": "2025-06-03T05:55:29.620859+00:00"} {"global_step": 232793, "acc_step": 0, "speed/wps": 5508.945541193403, "speed/FLOPS": 243467195581317.88, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.13 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.13, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05804356932640076, "optim/lr": 2.2021173386588932e-05, "optim/total_tokens": 1952809222144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2922970056533813, "created_at": "2025-06-03T05:55:32.600077+00:00"} {"global_step": 232794, "acc_step": 0, "speed/wps": 5518.377431784442, "speed/FLOPS": 243884036868649.3, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.12 hours", "speed/est_time_elapsed_hrs": 191.91, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.12, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04279391095042229, "optim/lr": 2.201762616149461e-05, "optim/total_tokens": 1952817610752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2937687635421753, "created_at": "2025-06-03T05:55:35.572491+00:00"} {"global_step": 232795, "acc_step": 0, "speed/wps": 5518.095723803811, "speed/FLOPS": 243871586817817.6, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05569421127438545, "optim/lr": 2.2014078936400063e-05, "optim/total_tokens": 1952825999360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2860134840011597, "created_at": "2025-06-03T05:55:38.545610+00:00"} {"global_step": 232796, "acc_step": 0, "speed/wps": 5525.768835724507, "speed/FLOPS": 244210699090165.22, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044495660811662674, "optim/lr": 2.2010531711305516e-05, "optim/total_tokens": 1952834387968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.285772442817688, "created_at": "2025-06-03T05:55:41.513825+00:00"} {"global_step": 232797, "acc_step": 0, "speed/wps": 5531.097114679123, "speed/FLOPS": 244446181747355.22, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04741056635975838, "optim/lr": 2.2006984486210966e-05, "optim/total_tokens": 1952842776576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2949548959732056, "created_at": "2025-06-03T05:55:44.479136+00:00"} {"global_step": 232798, "acc_step": 0, "speed/wps": 5520.780511075506, "speed/FLOPS": 243990240673239.53, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04323607683181763, "optim/lr": 2.2003437261116644e-05, "optim/total_tokens": 1952851165184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.292379379272461, "created_at": "2025-06-03T05:55:47.454441+00:00"} {"global_step": 232799, "acc_step": 0, "speed/wps": 5516.88395577972, "speed/FLOPS": 243818032873543.78, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04869040101766586, "optim/lr": 2.1999890036022097e-05, "optim/total_tokens": 1952859553792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.288321614265442, "created_at": "2025-06-03T05:55:50.430993+00:00"} {"global_step": 232800, "acc_step": 0, "speed/wps": 5534.3752058789905, "speed/FLOPS": 244591056599597.6, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04442985728383064, "optim/lr": 2.199634281092755e-05, "optim/total_tokens": 1952867942400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2704535722732544, "created_at": "2025-06-03T05:55:53.395853+00:00"} {"global_step": 232801, "acc_step": 0, "speed/wps": 5519.736523025565, "speed/FLOPS": 243944101745047.38, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.049256183207035065, "optim/lr": 2.1992795585833005e-05, "optim/total_tokens": 1952876331008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.272697925567627, "created_at": "2025-06-03T05:55:56.367689+00:00"} {"global_step": 232802, "acc_step": 0, "speed/wps": 5516.000014002127, "speed/FLOPS": 243778967171398.3, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04564758390188217, "optim/lr": 2.198924836073868e-05, "optim/total_tokens": 1952884719616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2844157218933105, "created_at": "2025-06-03T05:55:59.342411+00:00"} {"global_step": 232803, "acc_step": 0, "speed/wps": 5520.210263908246, "speed/FLOPS": 243965038667236.22, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04433273896574974, "optim/lr": 2.1985701135644132e-05, "optim/total_tokens": 1952893108224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.298807144165039, "created_at": "2025-06-03T05:56:02.315394+00:00"} {"global_step": 232804, "acc_step": 0, "speed/wps": 5530.178574214837, "speed/FLOPS": 244405586960350.1, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04493452608585358, "optim/lr": 2.1982153910549586e-05, "optim/total_tokens": 1952901496832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.281017541885376, "created_at": "2025-06-03T05:56:05.281891+00:00"} {"global_step": 232805, "acc_step": 0, "speed/wps": 5527.562754838741, "speed/FLOPS": 244289981132903.97, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04303720220923424, "optim/lr": 2.197860668545504e-05, "optim/total_tokens": 1952909885440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2928980588912964, "created_at": "2025-06-03T05:56:08.249314+00:00"} {"global_step": 232806, "acc_step": 0, "speed/wps": 5527.5063622452035, "speed/FLOPS": 244287488868913.06, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.61, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.08096310496330261, "optim/lr": 2.1975059460360713e-05, "optim/total_tokens": 1952918274048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.287083625793457, "created_at": "2025-06-03T05:56:11.216551+00:00"} {"global_step": 232807, "acc_step": 0, "speed/wps": 5520.014790701875, "speed/FLOPS": 243956399752037.22, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045216042548418045, "optim/lr": 2.1971512235266167e-05, "optim/total_tokens": 1952926662656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3030532598495483, "created_at": "2025-06-03T05:56:14.187822+00:00"} {"global_step": 232808, "acc_step": 0, "speed/wps": 5519.101812672322, "speed/FLOPS": 243916050796176.12, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04333293065428734, "optim/lr": 2.196796501017162e-05, "optim/total_tokens": 1952935051264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2880804538726807, "created_at": "2025-06-03T05:56:17.161008+00:00"} {"global_step": 232809, "acc_step": 0, "speed/wps": 5514.608061048001, "speed/FLOPS": 243717449975487.06, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04452366754412651, "optim/lr": 2.1964417785077074e-05, "optim/total_tokens": 1952943439872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2804967164993286, "created_at": "2025-06-03T05:56:20.134974+00:00"} {"global_step": 232810, "acc_step": 0, "speed/wps": 5507.787516832861, "speed/FLOPS": 243416016831887.9, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04337732121348381, "optim/lr": 2.1960870559982748e-05, "optim/total_tokens": 1952951828480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2938005924224854, "created_at": "2025-06-03T05:56:23.113146+00:00"} {"global_step": 232811, "acc_step": 0, "speed/wps": 5517.82559120652, "speed/FLOPS": 243859648339681.3, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044039804488420486, "optim/lr": 2.19573233348882e-05, "optim/total_tokens": 1952960217088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.284848690032959, "created_at": "2025-06-03T05:56:26.091030+00:00"} {"global_step": 232812, "acc_step": 0, "speed/wps": 5504.909617960636, "speed/FLOPS": 243288828432157.3, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04583040997385979, "optim/lr": 2.1953776109793655e-05, "optim/total_tokens": 1952968605696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2834104299545288, "created_at": "2025-06-03T05:56:29.073291+00:00"} {"global_step": 232813, "acc_step": 0, "speed/wps": 5519.428661071635, "speed/FLOPS": 243930495822464.03, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04341888055205345, "optim/lr": 2.195022888469933e-05, "optim/total_tokens": 1952976994304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.275638222694397, "created_at": "2025-06-03T05:56:32.045112+00:00"} {"global_step": 232814, "acc_step": 0, "speed/wps": 5525.8449386894445, "speed/FLOPS": 244214062451685.2, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 191.66, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.048133451491594315, "optim/lr": 2.1946681659604782e-05, "optim/total_tokens": 1952985382912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.273977279663086, "created_at": "2025-06-03T05:56:35.013923+00:00"} {"global_step": 232815, "acc_step": 0, "speed/wps": 5520.920568148149, "speed/FLOPS": 243996430478973.25, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04218984767794609, "optim/lr": 2.1943134434510236e-05, "optim/total_tokens": 1952993771520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2794413566589355, "created_at": "2025-06-03T05:56:37.987886+00:00"} {"global_step": 232816, "acc_step": 0, "speed/wps": 5521.3810800669535, "speed/FLOPS": 244016782748670.75, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045337289571762085, "optim/lr": 2.193958720941569e-05, "optim/total_tokens": 1953002160128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2947735786437988, "created_at": "2025-06-03T05:56:40.958549+00:00"} {"global_step": 232817, "acc_step": 0, "speed/wps": 5504.3311852915085, "speed/FLOPS": 243263264668868.7, "speed/curr_iter_time": 2.9754, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9754, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.11 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.11, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04412328451871872, "optim/lr": 2.1936039984321367e-05, "optim/total_tokens": 1953010548736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.299074649810791, "created_at": "2025-06-03T05:56:43.938427+00:00"} {"global_step": 232818, "acc_step": 0, "speed/wps": 5513.929567837101, "speed/FLOPS": 243687464048408.34, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.047984734177589417, "optim/lr": 2.1932492759226817e-05, "optim/total_tokens": 1953018937344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2843246459960938, "created_at": "2025-06-03T05:56:46.912876+00:00"} {"global_step": 232819, "acc_step": 0, "speed/wps": 5513.196028680405, "speed/FLOPS": 243655045372276.16, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04329921677708626, "optim/lr": 2.192894553413227e-05, "optim/total_tokens": 1953027325952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.296985149383545, "created_at": "2025-06-03T05:56:49.891011+00:00"} {"global_step": 232820, "acc_step": 0, "speed/wps": 5525.048370130708, "speed/FLOPS": 244178858198596.5, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05325055867433548, "optim/lr": 2.1925398309037724e-05, "optim/total_tokens": 1953035714560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2844009399414062, "created_at": "2025-06-03T05:56:52.860002+00:00"} {"global_step": 232821, "acc_step": 0, "speed/wps": 5534.619344039938, "speed/FLOPS": 244601846256699.1, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.37, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0435328371822834, "optim/lr": 2.19218510839434e-05, "optim/total_tokens": 1953044103168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2968668937683105, "created_at": "2025-06-03T05:56:55.823341+00:00"} {"global_step": 232822, "acc_step": 0, "speed/wps": 5526.005703243883, "speed/FLOPS": 244221167422123.75, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05914555490016937, "optim/lr": 2.1918303858848855e-05, "optim/total_tokens": 1953052491776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.297711730003357, "created_at": "2025-06-03T05:56:58.791527+00:00"} {"global_step": 232823, "acc_step": 0, "speed/wps": 5531.387530269392, "speed/FLOPS": 244459016629963.4, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.48, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0431499257683754, "optim/lr": 2.191475663375431e-05, "optim/total_tokens": 1953060880384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.280404806137085, "created_at": "2025-06-03T05:57:01.757257+00:00"} {"global_step": 232824, "acc_step": 0, "speed/wps": 5537.348186631277, "speed/FLOPS": 244722447131753.7, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.06011351943016052, "optim/lr": 2.191120940865976e-05, "optim/total_tokens": 1953069268992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.3041785955429077, "created_at": "2025-06-03T05:57:04.719449+00:00"} {"global_step": 232825, "acc_step": 0, "speed/wps": 5510.057539537187, "speed/FLOPS": 243516340216389.62, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.1 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.1, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0456140860915184, "optim/lr": 2.1907662183565436e-05, "optim/total_tokens": 1953077657600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.284535527229309, "created_at": "2025-06-03T05:57:07.696647+00:00"} {"global_step": 232826, "acc_step": 0, "speed/wps": 5524.5698914917675, "speed/FLOPS": 244157711891831.03, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0562276765704155, "optim/lr": 2.190411495847089e-05, "optim/total_tokens": 1953086046208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2981173992156982, "created_at": "2025-06-03T05:57:10.665768+00:00"} {"global_step": 232827, "acc_step": 0, "speed/wps": 5514.966674498443, "speed/FLOPS": 243733298854446.56, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.048284150660037994, "optim/lr": 2.1900567733376343e-05, "optim/total_tokens": 1953094434816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3067774772644043, "created_at": "2025-06-03T05:57:13.640244+00:00"} {"global_step": 232828, "acc_step": 0, "speed/wps": 5522.59405362509, "speed/FLOPS": 244070389971378.88, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04504720866680145, "optim/lr": 2.1897020508281797e-05, "optim/total_tokens": 1953102823424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2851375341415405, "created_at": "2025-06-03T05:57:16.610090+00:00"} {"global_step": 232829, "acc_step": 0, "speed/wps": 5521.7716719174, "speed/FLOPS": 244034044909230.16, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05414624139666557, "optim/lr": 2.189347328318747e-05, "optim/total_tokens": 1953111212032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.288651466369629, "created_at": "2025-06-03T05:57:19.580281+00:00"} {"global_step": 232830, "acc_step": 0, "speed/wps": 5515.191032319855, "speed/FLOPS": 243743214321785.56, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04348478838801384, "optim/lr": 2.1889926058092924e-05, "optim/total_tokens": 1953119600640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2851941585540771, "created_at": "2025-06-03T05:57:22.554627+00:00"} {"global_step": 232831, "acc_step": 0, "speed/wps": 5525.882561797425, "speed/FLOPS": 244215725200485.4, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0536462776362896, "optim/lr": 2.1886378832998378e-05, "optim/total_tokens": 1953127989248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2831624746322632, "created_at": "2025-06-03T05:57:25.524690+00:00"} {"global_step": 232832, "acc_step": 0, "speed/wps": 5515.280026248091, "speed/FLOPS": 243747147397901.38, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04540641978383064, "optim/lr": 2.188283160790383e-05, "optim/total_tokens": 1953136377856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.293778896331787, "created_at": "2025-06-03T05:57:28.498976+00:00"} {"global_step": 232833, "acc_step": 0, "speed/wps": 5512.439779704906, "speed/FLOPS": 243621623038392.25, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05082124099135399, "optim/lr": 2.1879284382809505e-05, "optim/total_tokens": 1953144766464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2797576189041138, "created_at": "2025-06-03T05:57:31.475354+00:00"} {"global_step": 232834, "acc_step": 0, "speed/wps": 5521.386176555607, "speed/FLOPS": 244017007987383.03, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04853440821170807, "optim/lr": 2.187573715771496e-05, "optim/total_tokens": 1953153155072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3001151084899902, "created_at": "2025-06-03T05:57:34.446080+00:00"} {"global_step": 232835, "acc_step": 0, "speed/wps": 5508.071695687594, "speed/FLOPS": 243428576082707.84, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.25, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04603654146194458, "optim/lr": 2.1872189932620413e-05, "optim/total_tokens": 1953161543680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2642306089401245, "created_at": "2025-06-03T05:57:37.424019+00:00"} {"global_step": 232836, "acc_step": 0, "speed/wps": 5508.074582609535, "speed/FLOPS": 243428703669881.06, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.046473030000925064, "optim/lr": 2.1868642707525866e-05, "optim/total_tokens": 1953169932288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2883727550506592, "created_at": "2025-06-03T05:57:40.404455+00:00"} {"global_step": 232837, "acc_step": 0, "speed/wps": 5519.065022038092, "speed/FLOPS": 243914424838454.72, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04345938563346863, "optim/lr": 2.186509548243154e-05, "optim/total_tokens": 1953178320896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.276651382446289, "created_at": "2025-06-03T05:57:43.380292+00:00"} {"global_step": 232838, "acc_step": 0, "speed/wps": 5525.660637860941, "speed/FLOPS": 244205917298402.5, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04755648598074913, "optim/lr": 2.1861548257336994e-05, "optim/total_tokens": 1953186709504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2805137634277344, "created_at": "2025-06-03T05:57:46.352654+00:00"} {"global_step": 232839, "acc_step": 0, "speed/wps": 5521.315004189499, "speed/FLOPS": 244013862533094.25, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04320486634969711, "optim/lr": 2.1858001032242447e-05, "optim/total_tokens": 1953195098112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.304223895072937, "created_at": "2025-06-03T05:57:49.324259+00:00"} {"global_step": 232840, "acc_step": 0, "speed/wps": 5541.429832380073, "speed/FLOPS": 244902834982093.66, "speed/curr_iter_time": 2.9554, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9554, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.15, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04635072872042656, "optim/lr": 2.185445380714812e-05, "optim/total_tokens": 1953203486720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2898491621017456, "created_at": "2025-06-03T05:57:52.284588+00:00"} {"global_step": 232841, "acc_step": 0, "speed/wps": 5505.228650085153, "speed/FLOPS": 243302928019106.53, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04269839823246002, "optim/lr": 2.1850906582053575e-05, "optim/total_tokens": 1953211875328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2903721332550049, "created_at": "2025-06-03T05:57:55.264247+00:00"} {"global_step": 232842, "acc_step": 0, "speed/wps": 5517.1198229719985, "speed/FLOPS": 243828456996164.75, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04494831711053848, "optim/lr": 2.1847359356959028e-05, "optim/total_tokens": 1953220263936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2814338207244873, "created_at": "2025-06-03T05:57:58.240368+00:00"} {"global_step": 232843, "acc_step": 0, "speed/wps": 5518.352758316911, "speed/FLOPS": 243882946427674.72, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04270085319876671, "optim/lr": 2.1843812131864482e-05, "optim/total_tokens": 1953228652544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.296820878982544, "created_at": "2025-06-03T05:58:01.215957+00:00"} {"global_step": 232844, "acc_step": 0, "speed/wps": 5511.4636404415405, "speed/FLOPS": 243578482679285.2, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04314768686890602, "optim/lr": 2.184026490677016e-05, "optim/total_tokens": 1953237041152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2755093574523926, "created_at": "2025-06-03T05:58:04.197775+00:00"} {"global_step": 232845, "acc_step": 0, "speed/wps": 5504.4665734075115, "speed/FLOPS": 243269248130616.8, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.09 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.09, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04220126196742058, "optim/lr": 2.183671768167561e-05, "optim/total_tokens": 1953245429760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2928705215454102, "created_at": "2025-06-03T05:58:07.178549+00:00"} {"global_step": 232846, "acc_step": 0, "speed/wps": 5520.301904778111, "speed/FLOPS": 243969088724623.75, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0431363582611084, "optim/lr": 2.1833170456581063e-05, "optim/total_tokens": 1953253818368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2897298336029053, "created_at": "2025-06-03T05:58:10.153431+00:00"} {"global_step": 232847, "acc_step": 0, "speed/wps": 5520.625768726309, "speed/FLOPS": 243983401853448.16, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04368797317147255, "optim/lr": 2.1829623231486517e-05, "optim/total_tokens": 1953262206976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.30348539352417, "created_at": "2025-06-03T05:58:13.124752+00:00"} {"global_step": 232848, "acc_step": 0, "speed/wps": 5519.014957470539, "speed/FLOPS": 243912212240822.56, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04254123196005821, "optim/lr": 2.1826076006392194e-05, "optim/total_tokens": 1953270595584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.3056942224502563, "created_at": "2025-06-03T05:58:16.097307+00:00"} {"global_step": 232849, "acc_step": 0, "speed/wps": 5517.772275174909, "speed/FLOPS": 243857292043980.28, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04340603947639465, "optim/lr": 2.1822528781297647e-05, "optim/total_tokens": 1953278984192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.289282202720642, "created_at": "2025-06-03T05:58:19.070376+00:00"} {"global_step": 232850, "acc_step": 0, "speed/wps": 5519.171428060176, "speed/FLOPS": 243919127439995.44, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04381152614951134, "optim/lr": 2.1818981556203098e-05, "optim/total_tokens": 1953287372800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2791686058044434, "created_at": "2025-06-03T05:58:22.045696+00:00"} {"global_step": 232851, "acc_step": 0, "speed/wps": 5519.511183502967, "speed/FLOPS": 243934142891540.75, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04628262668848038, "optim/lr": 2.181543433110855e-05, "optim/total_tokens": 1953295761408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2847121953964233, "created_at": "2025-06-03T05:58:25.017517+00:00"} {"global_step": 232852, "acc_step": 0, "speed/wps": 5508.520004174858, "speed/FLOPS": 243448389023194.06, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.08 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.08, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04257490858435631, "optim/lr": 2.181188710601423e-05, "optim/total_tokens": 1953304150016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2795963287353516, "created_at": "2025-06-03T05:58:27.998546+00:00"} {"global_step": 232853, "acc_step": 0, "speed/wps": 5512.127839109102, "speed/FLOPS": 243607836860714.44, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04325218126177788, "optim/lr": 2.1808339880919682e-05, "optim/total_tokens": 1953312538624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3005369901657104, "created_at": "2025-06-03T05:58:30.977701+00:00"} {"global_step": 232854, "acc_step": 0, "speed/wps": 5517.310343966048, "speed/FLOPS": 243836877048926.9, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044577743858098984, "optim/lr": 2.1804792655825136e-05, "optim/total_tokens": 1953320927232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2840911149978638, "created_at": "2025-06-03T05:58:33.950841+00:00"} {"global_step": 232855, "acc_step": 0, "speed/wps": 5521.154270288204, "speed/FLOPS": 244006758917367.72, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043171271681785583, "optim/lr": 2.1801245430730586e-05, "optim/total_tokens": 1953329315840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2977604866027832, "created_at": "2025-06-03T05:58:36.922399+00:00"} {"global_step": 232856, "acc_step": 0, "speed/wps": 5517.78417034929, "speed/FLOPS": 243857817749802.94, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044636428356170654, "optim/lr": 2.1797698205636263e-05, "optim/total_tokens": 1953337704448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.277368426322937, "created_at": "2025-06-03T05:58:39.895383+00:00"} {"global_step": 232857, "acc_step": 0, "speed/wps": 5521.578553787839, "speed/FLOPS": 244025510076371.75, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04367890581488609, "optim/lr": 2.1794150980541717e-05, "optim/total_tokens": 1953346093056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2908074855804443, "created_at": "2025-06-03T05:58:42.866299+00:00"} {"global_step": 232858, "acc_step": 0, "speed/wps": 5519.404398132281, "speed/FLOPS": 243929423524733.53, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04385487362742424, "optim/lr": 2.179060375544717e-05, "optim/total_tokens": 1953354481664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2922509908676147, "created_at": "2025-06-03T05:58:45.840136+00:00"} {"global_step": 232859, "acc_step": 0, "speed/wps": 5509.352597074944, "speed/FLOPS": 243485185367781.1, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 192.13, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.046393219381570816, "optim/lr": 2.1787056530352624e-05, "optim/total_tokens": 1953362870272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2784793376922607, "created_at": "2025-06-03T05:58:48.818004+00:00"} {"global_step": 232860, "acc_step": 0, "speed/wps": 5508.20187404176, "speed/FLOPS": 243434329299648.78, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04399716481566429, "optim/lr": 2.1783509305258298e-05, "optim/total_tokens": 1953371258880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2887547016143799, "created_at": "2025-06-03T05:58:51.799187+00:00"} {"global_step": 232861, "acc_step": 0, "speed/wps": 5525.242160984307, "speed/FLOPS": 244187422762414.1, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0450417622923851, "optim/lr": 2.177996208016375e-05, "optim/total_tokens": 1953379647488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2873960733413696, "created_at": "2025-06-03T05:58:54.768636+00:00"} {"global_step": 232862, "acc_step": 0, "speed/wps": 5525.341180425824, "speed/FLOPS": 244191798914901.7, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04409833997488022, "optim/lr": 2.1776414855069205e-05, "optim/total_tokens": 1953388036096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.282216191291809, "created_at": "2025-06-03T05:58:57.738097+00:00"} {"global_step": 232863, "acc_step": 0, "speed/wps": 5505.500031281961, "speed/FLOPS": 243314921678950.56, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04380573332309723, "optim/lr": 2.177286762997466e-05, "optim/total_tokens": 1953396424704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2967588901519775, "created_at": "2025-06-03T05:59:00.718266+00:00"} {"global_step": 232864, "acc_step": 0, "speed/wps": 5521.239557489149, "speed/FLOPS": 244010528175110.0, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04591064527630806, "optim/lr": 2.1769320404880332e-05, "optim/total_tokens": 1953404813312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.288780689239502, "created_at": "2025-06-03T05:59:03.693472+00:00"} {"global_step": 232865, "acc_step": 0, "speed/wps": 5517.799300178348, "speed/FLOPS": 243858486410805.78, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045014698058366776, "optim/lr": 2.1765773179785786e-05, "optim/total_tokens": 1953413201920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.294589638710022, "created_at": "2025-06-03T05:59:06.669817+00:00"} {"global_step": 232866, "acc_step": 0, "speed/wps": 5518.082890469428, "speed/FLOPS": 243871019650124.84, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04417617246508598, "optim/lr": 2.176222595469124e-05, "optim/total_tokens": 1953421590528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.291835069656372, "created_at": "2025-06-03T05:59:09.643090+00:00"} {"global_step": 232867, "acc_step": 0, "speed/wps": 5518.667955684143, "speed/FLOPS": 243896876537980.0, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0439799502491951, "optim/lr": 2.1758678729596913e-05, "optim/total_tokens": 1953429979136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2962918281555176, "created_at": "2025-06-03T05:59:12.619163+00:00"} {"global_step": 232868, "acc_step": 0, "speed/wps": 5503.648954512594, "speed/FLOPS": 243233113560414.34, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044184960424900055, "optim/lr": 2.1755131504502367e-05, "optim/total_tokens": 1953438367744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.285935401916504, "created_at": "2025-06-03T05:59:15.602593+00:00"} {"global_step": 232869, "acc_step": 0, "speed/wps": 5503.6880933614075, "speed/FLOPS": 243234843297201.12, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.07 hours", "speed/est_time_elapsed_hrs": 192.43, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.07, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04274025931954384, "optim/lr": 2.175158427940782e-05, "optim/total_tokens": 1953446756352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2897896766662598, "created_at": "2025-06-03T05:59:18.583906+00:00"} {"global_step": 232870, "acc_step": 0, "speed/wps": 5505.843440054743, "speed/FLOPS": 243330098588982.1, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.06 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.06, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04359529912471771, "optim/lr": 2.1748037054313274e-05, "optim/total_tokens": 1953455144960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2906311750411987, "created_at": "2025-06-03T05:59:21.567687+00:00"} {"global_step": 232871, "acc_step": 0, "speed/wps": 5520.51330224027, "speed/FLOPS": 243978431410420.88, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04352577403187752, "optim/lr": 2.1744489829218948e-05, "optim/total_tokens": 1953463533568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2907277345657349, "created_at": "2025-06-03T05:59:24.539942+00:00"} {"global_step": 232872, "acc_step": 0, "speed/wps": 5529.747783988877, "speed/FLOPS": 244386548237346.94, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042962346225976944, "optim/lr": 2.17409426041244e-05, "optim/total_tokens": 1953471922176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2832287549972534, "created_at": "2025-06-03T05:59:27.506355+00:00"} {"global_step": 232873, "acc_step": 0, "speed/wps": 5525.078452350879, "speed/FLOPS": 244180187678753.3, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044295117259025574, "optim/lr": 2.1737395379029855e-05, "optim/total_tokens": 1953480310784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2901504039764404, "created_at": "2025-06-03T05:59:30.475479+00:00"} {"global_step": 232874, "acc_step": 0, "speed/wps": 5516.2562141885355, "speed/FLOPS": 243790289908286.16, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04365931451320648, "optim/lr": 2.173384815393531e-05, "optim/total_tokens": 1953488699392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2948675155639648, "created_at": "2025-06-03T05:59:33.452661+00:00"} {"global_step": 232875, "acc_step": 0, "speed/wps": 5516.7880241356925, "speed/FLOPS": 243813793185900.44, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.046704281121492386, "optim/lr": 2.1730300928840986e-05, "optim/total_tokens": 1953497088000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.28388512134552, "created_at": "2025-06-03T05:59:36.430574+00:00"} {"global_step": 232876, "acc_step": 0, "speed/wps": 5517.088825125988, "speed/FLOPS": 243827087050032.44, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04330616444349289, "optim/lr": 2.172675370374644e-05, "optim/total_tokens": 1953505476608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2762174606323242, "created_at": "2025-06-03T05:59:39.403500+00:00"} {"global_step": 232877, "acc_step": 0, "speed/wps": 5512.703497565714, "speed/FLOPS": 243633278018009.6, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04856747016310692, "optim/lr": 2.172320647865189e-05, "optim/total_tokens": 1953513865216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2841421365737915, "created_at": "2025-06-03T05:59:42.379011+00:00"} {"global_step": 232878, "acc_step": 0, "speed/wps": 5518.020537704999, "speed/FLOPS": 243868263977087.44, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04809514433145523, "optim/lr": 2.1719659253557344e-05, "optim/total_tokens": 1953522253824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.284507393836975, "created_at": "2025-06-03T05:59:45.354452+00:00"} {"global_step": 232879, "acc_step": 0, "speed/wps": 5513.796519041717, "speed/FLOPS": 243681583972657.84, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04293915629386902, "optim/lr": 2.171611202846302e-05, "optim/total_tokens": 1953530642432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.291778802871704, "created_at": "2025-06-03T05:59:48.329856+00:00"} {"global_step": 232880, "acc_step": 0, "speed/wps": 5519.340734527004, "speed/FLOPS": 243926609919240.2, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043038155883550644, "optim/lr": 2.1712564803368474e-05, "optim/total_tokens": 1953539031040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2918658256530762, "created_at": "2025-06-03T05:59:51.305149+00:00"} {"global_step": 232881, "acc_step": 0, "speed/wps": 5521.686351812078, "speed/FLOPS": 244030274197282.8, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04300544038414955, "optim/lr": 2.1709017578273928e-05, "optim/total_tokens": 1953547419648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2822232246398926, "created_at": "2025-06-03T05:59:54.276455+00:00"} {"global_step": 232882, "acc_step": 0, "speed/wps": 5525.334749926406, "speed/FLOPS": 244191514719741.72, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04291434958577156, "optim/lr": 2.1705470353179378e-05, "optim/total_tokens": 1953555808256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2909176349639893, "created_at": "2025-06-03T05:59:57.248023+00:00"} {"global_step": 232883, "acc_step": 0, "speed/wps": 5515.452319417495, "speed/FLOPS": 243754761874112.62, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04353421926498413, "optim/lr": 2.1701923128085055e-05, "optim/total_tokens": 1953564196864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2838492393493652, "created_at": "2025-06-03T06:00:00.225254+00:00"} {"global_step": 232884, "acc_step": 0, "speed/wps": 5516.072351347194, "speed/FLOPS": 243782164111794.22, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04340684786438942, "optim/lr": 2.169837590299051e-05, "optim/total_tokens": 1953572585472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2938278913497925, "created_at": "2025-06-03T06:00:03.201254+00:00"} {"global_step": 232885, "acc_step": 0, "speed/wps": 5513.494905812312, "speed/FLOPS": 243668254211714.6, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04373999312520027, "optim/lr": 2.1694828677895963e-05, "optim/total_tokens": 1953580974080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.277833342552185, "created_at": "2025-06-03T06:00:06.176362+00:00"} {"global_step": 232886, "acc_step": 0, "speed/wps": 5512.587547749103, "speed/FLOPS": 243628153629600.34, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.048424169421195984, "optim/lr": 2.1691281452801416e-05, "optim/total_tokens": 1953589362688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.281506896018982, "created_at": "2025-06-03T06:00:09.152093+00:00"} {"global_step": 232887, "acc_step": 0, "speed/wps": 5525.501345124979, "speed/FLOPS": 244198877374807.1, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04388386011123657, "optim/lr": 2.168773422770709e-05, "optim/total_tokens": 1953597751296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2733371257781982, "created_at": "2025-06-03T06:00:12.121332+00:00"} {"global_step": 232888, "acc_step": 0, "speed/wps": 5533.310103479383, "speed/FLOPS": 244543984525223.22, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.47, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04505087435245514, "optim/lr": 2.1684187002612544e-05, "optim/total_tokens": 1953606139904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2908300161361694, "created_at": "2025-06-03T06:00:15.085803+00:00"} {"global_step": 232889, "acc_step": 0, "speed/wps": 5524.497046152745, "speed/FLOPS": 244154492500702.47, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 191.69, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043842848390340805, "optim/lr": 2.1680639777517997e-05, "optim/total_tokens": 1953614528512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2921819686889648, "created_at": "2025-06-03T06:00:18.058337+00:00"} {"global_step": 232890, "acc_step": 0, "speed/wps": 5538.754842222824, "speed/FLOPS": 244784614108984.06, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.28, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04620421677827835, "optim/lr": 2.167709255242345e-05, "optim/total_tokens": 1953622917120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2936699390411377, "created_at": "2025-06-03T06:00:21.020121+00:00"} {"global_step": 232891, "acc_step": 0, "speed/wps": 5524.598514197428, "speed/FLOPS": 244158976868916.94, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 191.77, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04183517396450043, "optim/lr": 2.1673545327329125e-05, "optim/total_tokens": 1953631305728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2730543613433838, "created_at": "2025-06-03T06:00:23.988974+00:00"} {"global_step": 232892, "acc_step": 0, "speed/wps": 5519.443058323183, "speed/FLOPS": 243931132107290.62, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04401916638016701, "optim/lr": 2.1669998102234578e-05, "optim/total_tokens": 1953639694336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2972285747528076, "created_at": "2025-06-03T06:00:26.963546+00:00"} {"global_step": 232893, "acc_step": 0, "speed/wps": 5529.365207027123, "speed/FLOPS": 244369640293843.8, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04345332086086273, "optim/lr": 2.1666450877140032e-05, "optim/total_tokens": 1953648082944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.3000761270523071, "created_at": "2025-06-03T06:00:29.934178+00:00"} {"global_step": 232894, "acc_step": 0, "speed/wps": 5506.63806191348, "speed/FLOPS": 243365216807894.88, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04332207515835762, "optim/lr": 2.1662903652045706e-05, "optim/total_tokens": 1953656471552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.302754521369934, "created_at": "2025-06-03T06:00:32.914161+00:00"} {"global_step": 232895, "acc_step": 0, "speed/wps": 5512.658354503337, "speed/FLOPS": 243631282925715.7, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04307672381401062, "optim/lr": 2.165935642695116e-05, "optim/total_tokens": 1953664860160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.27556574344635, "created_at": "2025-06-03T06:00:35.890281+00:00"} {"global_step": 232896, "acc_step": 0, "speed/wps": 5501.040051404812, "speed/FLOPS": 243117813396627.03, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.05 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.05, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043223410844802856, "optim/lr": 2.1655809201856613e-05, "optim/total_tokens": 1953673248768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.295147180557251, "created_at": "2025-06-03T06:00:38.871780+00:00"} {"global_step": 232897, "acc_step": 0, "speed/wps": 5519.4208572524, "speed/FLOPS": 243930150933597.4, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04385277256369591, "optim/lr": 2.1652261976762067e-05, "optim/total_tokens": 1953681637376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2755801677703857, "created_at": "2025-06-03T06:00:41.843497+00:00"} {"global_step": 232898, "acc_step": 0, "speed/wps": 5528.669858173295, "speed/FLOPS": 244338909433622.72, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04457084834575653, "optim/lr": 2.164871475166774e-05, "optim/total_tokens": 1953690025984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.3065811395645142, "created_at": "2025-06-03T06:00:44.811839+00:00"} {"global_step": 232899, "acc_step": 0, "speed/wps": 5516.517345774905, "speed/FLOPS": 243801830587811.1, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04282072186470032, "optim/lr": 2.1645167526573194e-05, "optim/total_tokens": 1953698414592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3069367408752441, "created_at": "2025-06-03T06:00:47.787091+00:00"} {"global_step": 232900, "acc_step": 0, "speed/wps": 5516.066261942927, "speed/FLOPS": 243781894991294.0, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042552974075078964, "optim/lr": 2.1641620301478648e-05, "optim/total_tokens": 1953706803200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2881228923797607, "created_at": "2025-06-03T06:00:50.760568+00:00"} {"global_step": 232901, "acc_step": 0, "speed/wps": 5525.647728529002, "speed/FLOPS": 244205346772006.72, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045616354793310165, "optim/lr": 2.16380730763841e-05, "optim/total_tokens": 1953715191808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2878328561782837, "created_at": "2025-06-03T06:00:53.729136+00:00"} {"global_step": 232902, "acc_step": 0, "speed/wps": 5507.740639792236, "speed/FLOPS": 243413945106630.72, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.04 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.04, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0478161945939064, "optim/lr": 2.163452585128978e-05, "optim/total_tokens": 1953723580416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2902294397354126, "created_at": "2025-06-03T06:00:56.709620+00:00"} {"global_step": 232903, "acc_step": 0, "speed/wps": 5512.1771186062115, "speed/FLOPS": 243610014762251.34, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04368910193443298, "optim/lr": 2.163097862619523e-05, "optim/total_tokens": 1953731969024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2814631462097168, "created_at": "2025-06-03T06:00:59.688028+00:00"} {"global_step": 232904, "acc_step": 0, "speed/wps": 5515.641417903369, "speed/FLOPS": 243763119059294.47, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04493590071797371, "optim/lr": 2.1627431401100682e-05, "optim/total_tokens": 1953740357632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2979928255081177, "created_at": "2025-06-03T06:01:02.665941+00:00"} {"global_step": 232905, "acc_step": 0, "speed/wps": 5516.9120607501845, "speed/FLOPS": 243819274969384.03, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04333237558603287, "optim/lr": 2.1623884176006136e-05, "optim/total_tokens": 1953748746240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2902755737304688, "created_at": "2025-06-03T06:01:05.638826+00:00"} {"global_step": 232906, "acc_step": 0, "speed/wps": 5510.169286140735, "speed/FLOPS": 243521278844295.44, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045019544661045074, "optim/lr": 2.1620336950911813e-05, "optim/total_tokens": 1953757134848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2885265350341797, "created_at": "2025-06-03T06:01:08.615574+00:00"} {"global_step": 232907, "acc_step": 0, "speed/wps": 5512.128757065588, "speed/FLOPS": 243607877429692.56, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 192.22, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.041968945413827896, "optim/lr": 2.1616789725817267e-05, "optim/total_tokens": 1953765523456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2943881750106812, "created_at": "2025-06-03T06:01:11.593065+00:00"} {"global_step": 232908, "acc_step": 0, "speed/wps": 5519.748576911414, "speed/FLOPS": 243944634465104.5, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045513324439525604, "optim/lr": 2.1613242500722717e-05, "optim/total_tokens": 1953773912064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2890851497650146, "created_at": "2025-06-03T06:01:14.564653+00:00"} {"global_step": 232909, "acc_step": 0, "speed/wps": 5523.201344381717, "speed/FLOPS": 244097229114425.9, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042557746171951294, "optim/lr": 2.160969527562817e-05, "optim/total_tokens": 1953782300672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.3075568675994873, "created_at": "2025-06-03T06:01:17.535248+00:00"} {"global_step": 232910, "acc_step": 0, "speed/wps": 5523.729650229484, "speed/FLOPS": 244120577528782.75, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04769578576087952, "optim/lr": 2.1606148050533848e-05, "optim/total_tokens": 1953790689280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2909941673278809, "created_at": "2025-06-03T06:01:20.507285+00:00"} {"global_step": 232911, "acc_step": 0, "speed/wps": 5510.467866256142, "speed/FLOPS": 243534474557124.88, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.03 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.03, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04341086000204086, "optim/lr": 2.16026008254393e-05, "optim/total_tokens": 1953799077888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2850819826126099, "created_at": "2025-06-03T06:01:23.483792+00:00"} {"global_step": 232912, "acc_step": 0, "speed/wps": 5524.058738666102, "speed/FLOPS": 244135121553253.94, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04544210433959961, "optim/lr": 2.1599053600344755e-05, "optim/total_tokens": 1953807466496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.3025940656661987, "created_at": "2025-06-03T06:01:26.455989+00:00"} {"global_step": 232913, "acc_step": 0, "speed/wps": 5522.068633444084, "speed/FLOPS": 244047169088722.72, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04371560364961624, "optim/lr": 2.1595506375250205e-05, "optim/total_tokens": 1953815855104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2840770483016968, "created_at": "2025-06-03T06:01:29.426378+00:00"} {"global_step": 232914, "acc_step": 0, "speed/wps": 5528.8371119713265, "speed/FLOPS": 244346301195413.16, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04708188399672508, "optim/lr": 2.1591959150155882e-05, "optim/total_tokens": 1953824243712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3024332523345947, "created_at": "2025-06-03T06:01:32.397086+00:00"} {"global_step": 232915, "acc_step": 0, "speed/wps": 5519.369668884045, "speed/FLOPS": 243927888669721.9, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04761834815144539, "optim/lr": 2.1588411925061336e-05, "optim/total_tokens": 1953832632320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.287427306175232, "created_at": "2025-06-03T06:01:35.369724+00:00"} {"global_step": 232916, "acc_step": 0, "speed/wps": 5514.378468736698, "speed/FLOPS": 243707303170487.44, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04421664774417877, "optim/lr": 2.158486469996679e-05, "optim/total_tokens": 1953841020928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.293058156967163, "created_at": "2025-06-03T06:01:38.348242+00:00"} {"global_step": 232917, "acc_step": 0, "speed/wps": 5514.496105382586, "speed/FLOPS": 243712502108116.78, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04714095965027809, "optim/lr": 2.1581317474872243e-05, "optim/total_tokens": 1953849409536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2763595581054688, "created_at": "2025-06-03T06:01:41.322786+00:00"} {"global_step": 232918, "acc_step": 0, "speed/wps": 5526.827938985637, "speed/FLOPS": 244257506033325.25, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043723542243242264, "optim/lr": 2.1577770249777917e-05, "optim/total_tokens": 1953857798144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.285568356513977, "created_at": "2025-06-03T06:01:44.292845+00:00"} {"global_step": 232919, "acc_step": 0, "speed/wps": 5508.498061647681, "speed/FLOPS": 243447419275804.9, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04484139755368233, "optim/lr": 2.157422302468337e-05, "optim/total_tokens": 1953866186752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.292434811592102, "created_at": "2025-06-03T06:01:47.271520+00:00"} {"global_step": 232920, "acc_step": 0, "speed/wps": 5508.63326456397, "speed/FLOPS": 243453394552673.62, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.02 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.02, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043388593941926956, "optim/lr": 2.1570675799588824e-05, "optim/total_tokens": 1953874575360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.280844807624817, "created_at": "2025-06-03T06:01:50.252170+00:00"} {"global_step": 232921, "acc_step": 0, "speed/wps": 5518.352332056191, "speed/FLOPS": 243882927589132.7, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0433829128742218, "optim/lr": 2.1567128574494278e-05, "optim/total_tokens": 1953882963968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2767199277877808, "created_at": "2025-06-03T06:01:53.228875+00:00"} {"global_step": 232922, "acc_step": 0, "speed/wps": 5520.530921303024, "speed/FLOPS": 243979210082812.1, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045747868716716766, "optim/lr": 2.156358134939995e-05, "optim/total_tokens": 1953891352576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2907413244247437, "created_at": "2025-06-03T06:01:56.201021+00:00"} {"global_step": 232923, "acc_step": 0, "speed/wps": 5521.331794422535, "speed/FLOPS": 244014604575454.22, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04734564945101738, "optim/lr": 2.1560034124305405e-05, "optim/total_tokens": 1953899741184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2853944301605225, "created_at": "2025-06-03T06:01:59.174269+00:00"} {"global_step": 232924, "acc_step": 0, "speed/wps": 5521.442751504097, "speed/FLOPS": 244019508310529.47, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04410732537508011, "optim/lr": 2.155648689921086e-05, "optim/total_tokens": 1953908129792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2863479852676392, "created_at": "2025-06-03T06:02:02.144942+00:00"} {"global_step": 232925, "acc_step": 0, "speed/wps": 5532.201040686499, "speed/FLOPS": 244494969626475.75, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04705024138092995, "optim/lr": 2.1552939674116533e-05, "optim/total_tokens": 1953916518400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2915759086608887, "created_at": "2025-06-03T06:02:05.110123+00:00"} {"global_step": 232926, "acc_step": 0, "speed/wps": 5519.547483504191, "speed/FLOPS": 243935747165794.66, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0431131012737751, "optim/lr": 2.1549392449021986e-05, "optim/total_tokens": 1953924907008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2792112827301025, "created_at": "2025-06-03T06:02:08.083210+00:00"} {"global_step": 232927, "acc_step": 0, "speed/wps": 5524.034507855035, "speed/FLOPS": 244134050675429.34, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04964038357138634, "optim/lr": 2.154584522392744e-05, "optim/total_tokens": 1953933295616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2963778972625732, "created_at": "2025-06-03T06:02:11.057456+00:00"} {"global_step": 232928, "acc_step": 0, "speed/wps": 5510.174771417714, "speed/FLOPS": 243521521265461.72, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 192.22, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045582715421915054, "optim/lr": 2.1542297998832894e-05, "optim/total_tokens": 1953941684224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2932884693145752, "created_at": "2025-06-03T06:02:14.039664+00:00"} {"global_step": 232929, "acc_step": 0, "speed/wps": 5510.404834536508, "speed/FLOPS": 243531688877742.66, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05551191046833992, "optim/lr": 2.1538750773738567e-05, "optim/total_tokens": 1953950072832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2855184078216553, "created_at": "2025-06-03T06:02:17.021286+00:00"} {"global_step": 232930, "acc_step": 0, "speed/wps": 5528.586139944418, "speed/FLOPS": 244335209516415.1, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04287487640976906, "optim/lr": 2.153520354864402e-05, "optim/total_tokens": 1953958461440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2956193685531616, "created_at": "2025-06-03T06:02:19.991522+00:00"} {"global_step": 232931, "acc_step": 0, "speed/wps": 5526.094958869982, "speed/FLOPS": 244225112063945.66, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.047590095549821854, "optim/lr": 2.1531656323549475e-05, "optim/total_tokens": 1953966850048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2954436540603638, "created_at": "2025-06-03T06:02:22.959717+00:00"} {"global_step": 232932, "acc_step": 0, "speed/wps": 5515.2203528519785, "speed/FLOPS": 243744510139229.3, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04277272894978523, "optim/lr": 2.1528109098454928e-05, "optim/total_tokens": 1953975238656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2837142944335938, "created_at": "2025-06-03T06:02:25.934283+00:00"} {"global_step": 232933, "acc_step": 0, "speed/wps": 5510.604061326669, "speed/FLOPS": 243540493682132.6, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 192.16, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05158437788486481, "optim/lr": 2.1524561873360605e-05, "optim/total_tokens": 1953983627264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3011318445205688, "created_at": "2025-06-03T06:02:28.910569+00:00"} {"global_step": 232934, "acc_step": 0, "speed/wps": 5513.782569010951, "speed/FLOPS": 243680967452700.72, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.12, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04394465684890747, "optim/lr": 2.152101464826606e-05, "optim/total_tokens": 1953992015872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2906121015548706, "created_at": "2025-06-03T06:02:31.887186+00:00"} {"global_step": 232935, "acc_step": 0, "speed/wps": 5509.500633173025, "speed/FLOPS": 243491727805598.8, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04321502521634102, "optim/lr": 2.151746742317151e-05, "optim/total_tokens": 1954000404480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.289598822593689, "created_at": "2025-06-03T06:02:34.866044+00:00"} {"global_step": 232936, "acc_step": 0, "speed/wps": 5523.107543770194, "speed/FLOPS": 244093083607511.66, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04214410483837128, "optim/lr": 2.1513920198076963e-05, "optim/total_tokens": 1954008793088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2866690158843994, "created_at": "2025-06-03T06:02:37.842196+00:00"} {"global_step": 232937, "acc_step": 0, "speed/wps": 5507.9443934582005, "speed/FLOPS": 243422949975760.53, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042691100388765335, "optim/lr": 2.151037297298264e-05, "optim/total_tokens": 1954017181696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2828598022460938, "created_at": "2025-06-03T06:02:40.820339+00:00"} {"global_step": 232938, "acc_step": 0, "speed/wps": 5500.756010262511, "speed/FLOPS": 243105260231991.7, "speed/curr_iter_time": 2.976, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.976, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.01 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.01, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0441545732319355, "optim/lr": 2.1506825747888094e-05, "optim/total_tokens": 1954025570304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.305991291999817, "created_at": "2025-06-03T06:02:43.802808+00:00"} {"global_step": 232939, "acc_step": 0, "speed/wps": 5524.94367857631, "speed/FLOPS": 244174231367752.1, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04270736873149872, "optim/lr": 2.1503278522793547e-05, "optim/total_tokens": 1954033958912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2596040964126587, "created_at": "2025-06-03T06:02:46.772346+00:00"} {"global_step": 232940, "acc_step": 0, "speed/wps": 5513.64902962855, "speed/FLOPS": 243675065695515.12, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043213747441768646, "optim/lr": 2.1499731297698998e-05, "optim/total_tokens": 1954042347520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.29936945438385, "created_at": "2025-06-03T06:02:49.747591+00:00"} {"global_step": 232941, "acc_step": 0, "speed/wps": 5527.1642252147685, "speed/FLOPS": 244272368163383.9, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04308665916323662, "optim/lr": 2.1496184072604675e-05, "optim/total_tokens": 1954050736128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.290549635887146, "created_at": "2025-06-03T06:02:52.715015+00:00"} {"global_step": 232942, "acc_step": 0, "speed/wps": 5514.9283090898425, "speed/FLOPS": 243731603299758.38, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044369421899318695, "optim/lr": 2.149263684751013e-05, "optim/total_tokens": 1954059124736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2892850637435913, "created_at": "2025-06-03T06:02:55.689380+00:00"} {"global_step": 232943, "acc_step": 0, "speed/wps": 5506.26567084036, "speed/FLOPS": 243348759028533.28, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04248771816492081, "optim/lr": 2.1489089622415582e-05, "optim/total_tokens": 1954067513344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2899858951568604, "created_at": "2025-06-03T06:02:58.668069+00:00"} {"global_step": 232944, "acc_step": 0, "speed/wps": 5513.796951079475, "speed/FLOPS": 243681603066515.38, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 192.13, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04772947356104851, "optim/lr": 2.1485542397321036e-05, "optim/total_tokens": 1954075901952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.282057523727417, "created_at": "2025-06-03T06:03:01.643227+00:00"} {"global_step": 232945, "acc_step": 0, "speed/wps": 5505.561699948964, "speed/FLOPS": 243317647118383.25, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04540912061929703, "optim/lr": 2.148199517222671e-05, "optim/total_tokens": 1954084290560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2928344011306763, "created_at": "2025-06-03T06:03:04.622422+00:00"} {"global_step": 232946, "acc_step": 0, "speed/wps": 5519.673861419123, "speed/FLOPS": 243941332422773.8, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04449378699064255, "optim/lr": 2.1478447947132163e-05, "optim/total_tokens": 1954092679168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2885743379592896, "created_at": "2025-06-03T06:03:07.593902+00:00"} {"global_step": 232947, "acc_step": 0, "speed/wps": 5523.315692692889, "speed/FLOPS": 244102282724492.0, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0450490303337574, "optim/lr": 2.1474900722037617e-05, "optim/total_tokens": 1954101067776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2988098859786987, "created_at": "2025-06-03T06:03:10.567846+00:00"} {"global_step": 232948, "acc_step": 0, "speed/wps": 5516.224533311868, "speed/FLOPS": 243788889775694.9, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04451751708984375, "optim/lr": 2.147135349694307e-05, "optim/total_tokens": 1954109456384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2912192344665527, "created_at": "2025-06-03T06:03:13.541597+00:00"} {"global_step": 232949, "acc_step": 0, "speed/wps": 5527.013474597905, "speed/FLOPS": 244265705757730.16, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043979790061712265, "optim/lr": 2.1467806271848744e-05, "optim/total_tokens": 1954117844992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2988793849945068, "created_at": "2025-06-03T06:03:16.509299+00:00"} {"global_step": 232950, "acc_step": 0, "speed/wps": 5499.006991465516, "speed/FLOPS": 243027962553454.25, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04302440583705902, "optim/lr": 2.1464259046754198e-05, "optim/total_tokens": 1954126233600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2750216722488403, "created_at": "2025-06-03T06:03:19.492251+00:00"} {"global_step": 232951, "acc_step": 0, "speed/wps": 5512.410802663494, "speed/FLOPS": 243620342401479.78, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04393612965941429, "optim/lr": 2.146071182165965e-05, "optim/total_tokens": 1954134622208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2992441654205322, "created_at": "2025-06-03T06:03:22.467613+00:00"} {"global_step": 232952, "acc_step": 0, "speed/wps": 5501.322331867837, "speed/FLOPS": 243130288748250.34, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "5.0 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 5.0, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04339130222797394, "optim/lr": 2.1457164596565325e-05, "optim/total_tokens": 1954143010816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2840495109558105, "created_at": "2025-06-03T06:03:25.452803+00:00"} {"global_step": 232953, "acc_step": 0, "speed/wps": 5515.035166836622, "speed/FLOPS": 243736325865218.5, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.046093299984931946, "optim/lr": 2.145361737147078e-05, "optim/total_tokens": 1954151399424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.290574550628662, "created_at": "2025-06-03T06:03:28.427292+00:00"} {"global_step": 232954, "acc_step": 0, "speed/wps": 5507.242383238818, "speed/FLOPS": 243391924717277.84, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042293012142181396, "optim/lr": 2.1450070146376232e-05, "optim/total_tokens": 1954159788032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.289320468902588, "created_at": "2025-06-03T06:03:31.405168+00:00"} {"global_step": 232955, "acc_step": 0, "speed/wps": 5518.723817069862, "speed/FLOPS": 243899345325304.28, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04519252851605415, "optim/lr": 2.1446522921281686e-05, "optim/total_tokens": 1954168176640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.296910047531128, "created_at": "2025-06-03T06:03:34.380211+00:00"} {"global_step": 232956, "acc_step": 0, "speed/wps": 5537.37848224337, "speed/FLOPS": 244723786042741.22, "speed/curr_iter_time": 2.9575, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9575, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.38, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04305485635995865, "optim/lr": 2.144297569618736e-05, "optim/total_tokens": 1954176565248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2831249237060547, "created_at": "2025-06-03T06:03:37.342360+00:00"} {"global_step": 232957, "acc_step": 0, "speed/wps": 5518.7168129107495, "speed/FLOPS": 243899035777322.06, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042807940393686295, "optim/lr": 2.1439428471092813e-05, "optim/total_tokens": 1954184953856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2855021953582764, "created_at": "2025-06-03T06:03:40.314836+00:00"} {"global_step": 232958, "acc_step": 0, "speed/wps": 5525.293875693157, "speed/FLOPS": 244189708287845.38, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.73, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04268043488264084, "optim/lr": 2.1435881245998267e-05, "optim/total_tokens": 1954193342464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2869940996170044, "created_at": "2025-06-03T06:03:43.283584+00:00"} {"global_step": 232959, "acc_step": 0, "speed/wps": 5524.285827910658, "speed/FLOPS": 244145157735515.2, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04232246056199074, "optim/lr": 2.143233402090372e-05, "optim/total_tokens": 1954201731072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2857012748718262, "created_at": "2025-06-03T06:03:46.252797+00:00"} {"global_step": 232960, "acc_step": 0, "speed/wps": 5512.788903934601, "speed/FLOPS": 243637052542364.97, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 192.12, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04308637976646423, "optim/lr": 2.1428786795809398e-05, "optim/total_tokens": 1954210119680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2907447814941406, "created_at": "2025-06-03T06:03:49.227931+00:00"} {"global_step": 232961, "acc_step": 0, "speed/wps": 5517.685150308052, "speed/FLOPS": 243853441570810.7, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0431143157184124, "optim/lr": 2.1425239570714848e-05, "optim/total_tokens": 1954218508288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2764407396316528, "created_at": "2025-06-03T06:03:52.200793+00:00"} {"global_step": 232962, "acc_step": 0, "speed/wps": 5501.734958920805, "speed/FLOPS": 243148524751974.8, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.99 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.99, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0427432619035244, "optim/lr": 2.14216923456203e-05, "optim/total_tokens": 1954226896896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2912380695343018, "created_at": "2025-06-03T06:03:55.186781+00:00"} {"global_step": 232963, "acc_step": 0, "speed/wps": 5526.43758287969, "speed/FLOPS": 244240254291466.1, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04292130470275879, "optim/lr": 2.1418145120525755e-05, "optim/total_tokens": 1954235285504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2873196601867676, "created_at": "2025-06-03T06:03:58.154549+00:00"} {"global_step": 232964, "acc_step": 0, "speed/wps": 5525.68955130387, "speed/FLOPS": 244207195124587.53, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0464390367269516, "optim/lr": 2.1414597895431432e-05, "optim/total_tokens": 1954243674112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2922565937042236, "created_at": "2025-06-03T06:04:01.126846+00:00"} {"global_step": 232965, "acc_step": 0, "speed/wps": 5514.549296753935, "speed/FLOPS": 243714852894472.25, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04461408033967018, "optim/lr": 2.1411050670336886e-05, "optim/total_tokens": 1954252062720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2968087196350098, "created_at": "2025-06-03T06:04:04.101153+00:00"} {"global_step": 232966, "acc_step": 0, "speed/wps": 5520.4426802998005, "speed/FLOPS": 243975310282128.0, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043156158179044724, "optim/lr": 2.1407503445242336e-05, "optim/total_tokens": 1954260451328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2935242652893066, "created_at": "2025-06-03T06:04:07.073658+00:00"} {"global_step": 232967, "acc_step": 0, "speed/wps": 5518.991537035739, "speed/FLOPS": 243911177177481.06, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.91, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04629941284656525, "optim/lr": 2.140395622014779e-05, "optim/total_tokens": 1954268839936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2861815690994263, "created_at": "2025-06-03T06:04:10.051057+00:00"} {"global_step": 232968, "acc_step": 0, "speed/wps": 5508.3071592062815, "speed/FLOPS": 243438982365022.3, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.98 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.98, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04412604495882988, "optim/lr": 2.1400408995053467e-05, "optim/total_tokens": 1954277228544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2758487462997437, "created_at": "2025-06-03T06:04:13.030597+00:00"} {"global_step": 232969, "acc_step": 0, "speed/wps": 5513.353772526367, "speed/FLOPS": 243662016842861.47, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04375742748379707, "optim/lr": 2.139686176995892e-05, "optim/total_tokens": 1954285617152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.28428316116333, "created_at": "2025-06-03T06:04:16.005469+00:00"} {"global_step": 232970, "acc_step": 0, "speed/wps": 5511.596454936481, "speed/FLOPS": 243584352400155.34, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043502215296030045, "optim/lr": 2.1393314544864374e-05, "optim/total_tokens": 1954294005760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2809770107269287, "created_at": "2025-06-03T06:04:18.982116+00:00"} {"global_step": 232971, "acc_step": 0, "speed/wps": 5525.255153886845, "speed/FLOPS": 244187996982202.56, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04396340623497963, "optim/lr": 2.1389767319769825e-05, "optim/total_tokens": 1954302394368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3093308210372925, "created_at": "2025-06-03T06:04:21.953887+00:00"} {"global_step": 232972, "acc_step": 0, "speed/wps": 5518.739303929082, "speed/FLOPS": 243900029765212.88, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.044212792068719864, "optim/lr": 2.1386220094675502e-05, "optim/total_tokens": 1954310782976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2910820245742798, "created_at": "2025-06-03T06:04:24.926001+00:00"} {"global_step": 232973, "acc_step": 0, "speed/wps": 5525.698239801394, "speed/FLOPS": 244207579111706.34, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04380965977907181, "optim/lr": 2.1382672869580955e-05, "optim/total_tokens": 1954319171584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2967498302459717, "created_at": "2025-06-03T06:04:27.894262+00:00"} {"global_step": 232974, "acc_step": 0, "speed/wps": 5522.311525812705, "speed/FLOPS": 244057903688179.94, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043397314846515656, "optim/lr": 2.137912564448641e-05, "optim/total_tokens": 1954327560192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2872613668441772, "created_at": "2025-06-03T06:04:30.864307+00:00"} {"global_step": 232975, "acc_step": 0, "speed/wps": 5526.072454725557, "speed/FLOPS": 244224117495948.72, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04240050166845322, "optim/lr": 2.1375578419391863e-05, "optim/total_tokens": 1954335948800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2705084085464478, "created_at": "2025-06-03T06:04:33.833941+00:00"} {"global_step": 232976, "acc_step": 0, "speed/wps": 5531.846695081593, "speed/FLOPS": 244479309364444.1, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04314570128917694, "optim/lr": 2.1372031194297536e-05, "optim/total_tokens": 1954344337408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.293067216873169, "created_at": "2025-06-03T06:04:36.799954+00:00"} {"global_step": 232977, "acc_step": 0, "speed/wps": 5508.431587456456, "speed/FLOPS": 243444481456798.5, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04294499382376671, "optim/lr": 2.136848396920299e-05, "optim/total_tokens": 1954352726016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2922149896621704, "created_at": "2025-06-03T06:04:39.780976+00:00"} {"global_step": 232978, "acc_step": 0, "speed/wps": 5512.096981527739, "speed/FLOPS": 243606473113561.62, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045069482177495956, "optim/lr": 2.1364936744108444e-05, "optim/total_tokens": 1954361114624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2910218238830566, "created_at": "2025-06-03T06:04:42.758319+00:00"} {"global_step": 232979, "acc_step": 0, "speed/wps": 5507.619825809015, "speed/FLOPS": 243408605746954.38, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 192.43, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042763203382492065, "optim/lr": 2.1361389519014117e-05, "optim/total_tokens": 1954369503232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2833051681518555, "created_at": "2025-06-03T06:04:45.737302+00:00"} {"global_step": 232980, "acc_step": 0, "speed/wps": 5514.499182273534, "speed/FLOPS": 243712638090947.7, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04363541305065155, "optim/lr": 2.135784229391957e-05, "optim/total_tokens": 1954377891840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.272735595703125, "created_at": "2025-06-03T06:04:48.714684+00:00"} {"global_step": 232981, "acc_step": 0, "speed/wps": 5520.684480254349, "speed/FLOPS": 243985996602474.7, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.046843960881233215, "optim/lr": 2.1354295068825025e-05, "optim/total_tokens": 1954386280448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.268964171409607, "created_at": "2025-06-03T06:04:51.685720+00:00"} {"global_step": 232982, "acc_step": 0, "speed/wps": 5514.531496318082, "speed/FLOPS": 243714066206318.44, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042338598519563675, "optim/lr": 2.1350747843730478e-05, "optim/total_tokens": 1954394669056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2734167575836182, "created_at": "2025-06-03T06:04:54.662805+00:00"} {"global_step": 232983, "acc_step": 0, "speed/wps": 5515.944060736764, "speed/FLOPS": 243776494323464.1, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04210374504327774, "optim/lr": 2.1347200618636152e-05, "optim/total_tokens": 1954403057664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2876977920532227, "created_at": "2025-06-03T06:04:57.636687+00:00"} {"global_step": 232984, "acc_step": 0, "speed/wps": 5514.896062573733, "speed/FLOPS": 243730178168798.97, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04402961954474449, "optim/lr": 2.1343653393541606e-05, "optim/total_tokens": 1954411446272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.28651762008667, "created_at": "2025-06-03T06:05:00.614565+00:00"} {"global_step": 232985, "acc_step": 0, "speed/wps": 5508.1169503479105, "speed/FLOPS": 243430576107059.5, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.048157189041376114, "optim/lr": 2.134010616844706e-05, "optim/total_tokens": 1954419834880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2945194244384766, "created_at": "2025-06-03T06:05:03.592286+00:00"} {"global_step": 232986, "acc_step": 0, "speed/wps": 5519.669281146892, "speed/FLOPS": 243941129998185.16, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04435542970895767, "optim/lr": 2.1336558943352513e-05, "optim/total_tokens": 1954428223488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2996799945831299, "created_at": "2025-06-03T06:05:06.564086+00:00"} {"global_step": 232987, "acc_step": 0, "speed/wps": 5503.938545669446, "speed/FLOPS": 243245912007285.3, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.97 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.97, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05208612605929375, "optim/lr": 2.1333011718258187e-05, "optim/total_tokens": 1954436612096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2817745208740234, "created_at": "2025-06-03T06:05:09.544489+00:00"} {"global_step": 232988, "acc_step": 0, "speed/wps": 5531.63232023713, "speed/FLOPS": 244469835093588.78, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.047100652009248734, "optim/lr": 2.132946449316364e-05, "optim/total_tokens": 1954445000704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2821186780929565, "created_at": "2025-06-03T06:05:12.509514+00:00"} {"global_step": 232989, "acc_step": 0, "speed/wps": 5524.682083941673, "speed/FLOPS": 244162670223863.84, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042626842856407166, "optim/lr": 2.1325917268069094e-05, "optim/total_tokens": 1954453389312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2845079898834229, "created_at": "2025-06-03T06:05:15.478709+00:00"} {"global_step": 232990, "acc_step": 0, "speed/wps": 5520.276023633451, "speed/FLOPS": 243967944910501.5, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04290351644158363, "optim/lr": 2.1322370042974548e-05, "optim/total_tokens": 1954461777920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.285570740699768, "created_at": "2025-06-03T06:05:18.449890+00:00"} {"global_step": 232991, "acc_step": 0, "speed/wps": 5519.466705980508, "speed/FLOPS": 243932177212704.7, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05347931757569313, "optim/lr": 2.1318822817880225e-05, "optim/total_tokens": 1954470166528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.279413104057312, "created_at": "2025-06-03T06:05:21.423844+00:00"} {"global_step": 232992, "acc_step": 0, "speed/wps": 5513.052090680922, "speed/FLOPS": 243648684049440.5, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05158676207065582, "optim/lr": 2.131527559278568e-05, "optim/total_tokens": 1954478555136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.287440538406372, "created_at": "2025-06-03T06:05:24.399166+00:00"} {"global_step": 232993, "acc_step": 0, "speed/wps": 5510.571340615977, "speed/FLOPS": 243539047594199.78, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.045236214995384216, "optim/lr": 2.131172836769113e-05, "optim/total_tokens": 1954486943744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.287024974822998, "created_at": "2025-06-03T06:05:27.378217+00:00"} {"global_step": 232994, "acc_step": 0, "speed/wps": 5519.725625647998, "speed/FLOPS": 243943620136736.75, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04352980852127075, "optim/lr": 2.1308181142596582e-05, "optim/total_tokens": 1954495332352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2970157861709595, "created_at": "2025-06-03T06:05:30.349654+00:00"} {"global_step": 232995, "acc_step": 0, "speed/wps": 5505.401834121075, "speed/FLOPS": 243310581867058.03, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.06024688482284546, "optim/lr": 2.130463391750226e-05, "optim/total_tokens": 1954503720960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2833372354507446, "created_at": "2025-06-03T06:05:33.328780+00:00"} {"global_step": 232996, "acc_step": 0, "speed/wps": 5509.926450717461, "speed/FLOPS": 243510546761531.12, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.96 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.96, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04924570769071579, "optim/lr": 2.1301086692407713e-05, "optim/total_tokens": 1954512109568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3004207611083984, "created_at": "2025-06-03T06:05:36.305824+00:00"} {"global_step": 232997, "acc_step": 0, "speed/wps": 5525.1081540114865, "speed/FLOPS": 244181500340125.28, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 191.71, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05159037560224533, "optim/lr": 2.1297539467313167e-05, "optim/total_tokens": 1954520498176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2923431396484375, "created_at": "2025-06-03T06:05:39.278639+00:00"} {"global_step": 232998, "acc_step": 0, "speed/wps": 5520.4463406933855, "speed/FLOPS": 243975472052788.88, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04566766321659088, "optim/lr": 2.1293992242218617e-05, "optim/total_tokens": 1954528886784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.285339593887329, "created_at": "2025-06-03T06:05:42.250145+00:00"} {"global_step": 232999, "acc_step": 0, "speed/wps": 5524.817561102392, "speed/FLOPS": 244168657620932.66, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04645800217986107, "optim/lr": 2.1290445017124294e-05, "optim/total_tokens": 1954537275392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.292858600616455, "created_at": "2025-06-03T06:05:45.219969+00:00"} {"global_step": 233000, "acc_step": 0, "speed/wps": 5516.013572272499, "speed/FLOPS": 243779566377551.28, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04264691099524498, "optim/lr": 2.1286897792029748e-05, "optim/total_tokens": 1954545664000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.300639033317566, "created_at": "2025-06-03T06:05:48.195923+00:00"} {"global_step": 233001, "acc_step": 0, "speed/wps": 222.83384451048303, "speed/FLOPS": 9848115360352.242, "speed/curr_iter_time": 5.4361, "speed/data_load_time": 3.9206, "speed/curr_step_time": 5.4361, "speed/est_time_elapsed": "14.66 days", "speed/est_time_remaining": "9.06 hours", "speed/est_time_elapsed_hrs": 351.84, "speed/est_time_elapsed_days": 14.66, "speed/est_time_remaining_hrs": 9.06, "speed/est_time_remaining_days": 0.38, "optim/grad_norm": 0.05041760951280594, "optim/lr": 2.12833505669352e-05, "optim/total_tokens": 1954554052608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2821661233901978, "created_at": "2025-06-03T06:07:01.731104+00:00"} {"global_step": 233002, "acc_step": 0, "speed/wps": 5611.435222594625, "speed/FLOPS": 247996714909507.25, "speed/curr_iter_time": 2.9169, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9169, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "4.86 hours", "speed/est_time_elapsed_hrs": 188.79, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 4.86, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04568030312657356, "optim/lr": 2.1279803341840655e-05, "optim/total_tokens": 1954562441216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2852377891540527, "created_at": "2025-06-03T06:07:04.656609+00:00"} {"global_step": 233003, "acc_step": 0, "speed/wps": 5559.32254197176, "speed/FLOPS": 245693601162856.3, "speed/curr_iter_time": 2.9459, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9459, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 190.67, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05616367980837822, "optim/lr": 2.127625611674633e-05, "optim/total_tokens": 1954570829824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2702666521072388, "created_at": "2025-06-03T06:07:07.611688+00:00"} {"global_step": 233004, "acc_step": 0, "speed/wps": 5535.297416546764, "speed/FLOPS": 244631813590811.1, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 191.43, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.0458538644015789, "optim/lr": 2.1272708891651782e-05, "optim/total_tokens": 1954579218432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2873589992523193, "created_at": "2025-06-03T06:07:10.579237+00:00"} {"global_step": 233005, "acc_step": 0, "speed/wps": 5524.124171200661, "speed/FLOPS": 244138013336367.4, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.05531393364071846, "optim/lr": 2.1269161666557236e-05, "optim/total_tokens": 1954587607040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.294150948524475, "created_at": "2025-06-03T06:07:13.549201+00:00"} {"global_step": 233006, "acc_step": 0, "speed/wps": 5535.212890098999, "speed/FLOPS": 244628077954465.47, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 191.5, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04554949328303337, "optim/lr": 2.126561444146291e-05, "optim/total_tokens": 1954595995648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2816351652145386, "created_at": "2025-06-03T06:07:16.512523+00:00"} {"global_step": 233007, "acc_step": 0, "speed/wps": 5558.114498487201, "speed/FLOPS": 245640211824165.88, "speed/curr_iter_time": 2.9456, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9456, "speed/est_time_elapsed": "7.94 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 190.65, "speed/est_time_elapsed_days": 7.94, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046664465218782425, "optim/lr": 2.1262067216368363e-05, "optim/total_tokens": 1954604384256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2696654796600342, "created_at": "2025-06-03T06:07:19.464849+00:00"} {"global_step": 233008, "acc_step": 0, "speed/wps": 5555.0503678840805, "speed/FLOPS": 245504792935150.16, "speed/curr_iter_time": 2.9481, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9481, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 190.81, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.053057920187711716, "optim/lr": 2.1258519991273817e-05, "optim/total_tokens": 1954612772864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2793794870376587, "created_at": "2025-06-03T06:07:22.420755+00:00"} {"global_step": 233009, "acc_step": 0, "speed/wps": 5522.008736359023, "speed/FLOPS": 244044521944144.06, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04866890609264374, "optim/lr": 2.125497276617927e-05, "optim/total_tokens": 1954621161472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2955702543258667, "created_at": "2025-06-03T06:07:25.390920+00:00"} {"global_step": 233010, "acc_step": 0, "speed/wps": 5530.440053312731, "speed/FLOPS": 244417142998105.66, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04846365749835968, "optim/lr": 2.1251425541084944e-05, "optim/total_tokens": 1954629550080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2933493852615356, "created_at": "2025-06-03T06:07:28.356806+00:00"} {"global_step": 233011, "acc_step": 0, "speed/wps": 5532.37550008671, "speed/FLOPS": 244502679839000.94, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.6, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04351530224084854, "optim/lr": 2.1247878315990398e-05, "optim/total_tokens": 1954637938688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2899154424667358, "created_at": "2025-06-03T06:07:31.322426+00:00"} {"global_step": 233012, "acc_step": 0, "speed/wps": 5541.143661497787, "speed/FLOPS": 244890187693852.0, "speed/curr_iter_time": 2.9555, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9555, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.3, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.047555066645145416, "optim/lr": 2.124433109089585e-05, "optim/total_tokens": 1954646327296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.274033784866333, "created_at": "2025-06-03T06:07:34.287352+00:00"} {"global_step": 233013, "acc_step": 0, "speed/wps": 5514.962134019316, "speed/FLOPS": 243733098188509.44, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04610986262559891, "optim/lr": 2.1240783865801305e-05, "optim/total_tokens": 1954654715904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2847710847854614, "created_at": "2025-06-03T06:07:37.263687+00:00"} {"global_step": 233014, "acc_step": 0, "speed/wps": 5549.928095041971, "speed/FLOPS": 245278414693698.03, "speed/curr_iter_time": 2.9499, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9499, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 190.94, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.055660925805568695, "optim/lr": 2.123723664070698e-05, "optim/total_tokens": 1954663104512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.294784426689148, "created_at": "2025-06-03T06:07:40.224325+00:00"} {"global_step": 233015, "acc_step": 0, "speed/wps": 5534.5923042032755, "speed/FLOPS": 244600651234321.03, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.53, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04672989994287491, "optim/lr": 2.1233689415612433e-05, "optim/total_tokens": 1954671493120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2799344062805176, "created_at": "2025-06-03T06:07:43.188069+00:00"} {"global_step": 233016, "acc_step": 0, "speed/wps": 5517.435893971445, "speed/FLOPS": 243842425716542.25, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 192.13, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04976871237158775, "optim/lr": 2.1230142190517886e-05, "optim/total_tokens": 1954679881728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2828210592269897, "created_at": "2025-06-03T06:07:46.161046+00:00"} {"global_step": 233017, "acc_step": 0, "speed/wps": 5539.19947250653, "speed/FLOPS": 244804264491699.78, "speed/curr_iter_time": 2.9558, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9558, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 191.32, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04589347541332245, "optim/lr": 2.122659496542334e-05, "optim/total_tokens": 1954688270336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2716807126998901, "created_at": "2025-06-03T06:07:49.125845+00:00"} {"global_step": 233018, "acc_step": 0, "speed/wps": 5524.786787704204, "speed/FLOPS": 244167297594245.25, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04362698271870613, "optim/lr": 2.1223047740329017e-05, "optim/total_tokens": 1954696658944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.292974829673767, "created_at": "2025-06-03T06:07:52.094435+00:00"} {"global_step": 233019, "acc_step": 0, "speed/wps": 5524.763015927985, "speed/FLOPS": 244166247003411.38, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.046832192689180374, "optim/lr": 2.1219500515234467e-05, "optim/total_tokens": 1954705047552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2843496799468994, "created_at": "2025-06-03T06:07:55.063536+00:00"} {"global_step": 233020, "acc_step": 0, "speed/wps": 5526.695794033361, "speed/FLOPS": 244251665902813.88, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04373285919427872, "optim/lr": 2.121595329013992e-05, "optim/total_tokens": 1954713436160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2843379974365234, "created_at": "2025-06-03T06:07:58.033487+00:00"} {"global_step": 233021, "acc_step": 0, "speed/wps": 5513.665539980367, "speed/FLOPS": 243675795368557.78, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04457102715969086, "optim/lr": 2.1212406065045375e-05, "optim/total_tokens": 1954721824768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.293896198272705, "created_at": "2025-06-03T06:08:01.010406+00:00"} {"global_step": 233022, "acc_step": 0, "speed/wps": 5524.466235556127, "speed/FLOPS": 244153130830034.9, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04328169301152229, "optim/lr": 2.1208858839951052e-05, "optim/total_tokens": 1954730213376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.3013046979904175, "created_at": "2025-06-03T06:08:03.979938+00:00"} {"global_step": 233023, "acc_step": 0, "speed/wps": 5523.00171243885, "speed/FLOPS": 244088406404360.1, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.042489033192396164, "optim/lr": 2.1205311614856505e-05, "optim/total_tokens": 1954738601984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.280462622642517, "created_at": "2025-06-03T06:08:06.949714+00:00"} {"global_step": 233024, "acc_step": 0, "speed/wps": 5519.88879596138, "speed/FLOPS": 243950831429406.88, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04295627772808075, "optim/lr": 2.1201764389761956e-05, "optim/total_tokens": 1954746990592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2826968431472778, "created_at": "2025-06-03T06:08:09.922537+00:00"} {"global_step": 233025, "acc_step": 0, "speed/wps": 5486.797974228866, "speed/FLOPS": 242488386483009.53, "speed/curr_iter_time": 2.9849, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9849, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.95 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.95, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043401338160037994, "optim/lr": 2.119821716466741e-05, "optim/total_tokens": 1954755379200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2874541282653809, "created_at": "2025-06-03T06:08:12.914537+00:00"} {"global_step": 233026, "acc_step": 0, "speed/wps": 5509.798473864007, "speed/FLOPS": 243504890839653.38, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04420366883277893, "optim/lr": 2.1194669939573086e-05, "optim/total_tokens": 1954763767808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2997380495071411, "created_at": "2025-06-03T06:08:15.894301+00:00"} {"global_step": 233027, "acc_step": 0, "speed/wps": 5501.83844195783, "speed/FLOPS": 243153098172537.1, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04344897344708443, "optim/lr": 2.119112271447854e-05, "optim/total_tokens": 1954772156416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.286344051361084, "created_at": "2025-06-03T06:08:18.875978+00:00"} {"global_step": 233028, "acc_step": 0, "speed/wps": 5499.050973980947, "speed/FLOPS": 243029906355513.38, "speed/curr_iter_time": 2.9783, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9783, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04358983784914017, "optim/lr": 2.1187575489383994e-05, "optim/total_tokens": 1954780545024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.280720591545105, "created_at": "2025-06-03T06:08:21.861600+00:00"} {"global_step": 233029, "acc_step": 0, "speed/wps": 5526.5619960625645, "speed/FLOPS": 244245752717344.75, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04422811418771744, "optim/lr": 2.1184028264289444e-05, "optim/total_tokens": 1954788933632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.3079893589019775, "created_at": "2025-06-03T06:08:24.832844+00:00"} {"global_step": 233030, "acc_step": 0, "speed/wps": 5497.578939055816, "speed/FLOPS": 242964849946380.34, "speed/curr_iter_time": 2.979, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.979, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.94 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.94, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.04357115179300308, "optim/lr": 2.118048103919512e-05, "optim/total_tokens": 1954797322240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2884836196899414, "created_at": "2025-06-03T06:08:27.816549+00:00"} {"global_step": 233031, "acc_step": 0, "speed/wps": 5511.063962110931, "speed/FLOPS": 243560818942811.4, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.93 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.93, "speed/est_time_remaining_days": 0.21, "optim/grad_norm": 0.043151333928108215, "optim/lr": 2.1176933814100575e-05, "optim/total_tokens": 1954805710848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.28853178024292, "created_at": "2025-06-03T06:08:30.792710+00:00"} {"global_step": 233032, "acc_step": 0, "speed/wps": 5525.7818775334, "speed/FLOPS": 244211275471364.28, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04238928109407425, "optim/lr": 2.1173386589006028e-05, "optim/total_tokens": 1954814099456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2922474145889282, "created_at": "2025-06-03T06:08:33.761319+00:00"} {"global_step": 233033, "acc_step": 0, "speed/wps": 5521.281221720019, "speed/FLOPS": 244012369520857.6, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044550132006406784, "optim/lr": 2.1169839363911702e-05, "optim/total_tokens": 1954822488064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.286530613899231, "created_at": "2025-06-03T06:08:36.735826+00:00"} {"global_step": 233034, "acc_step": 0, "speed/wps": 5526.465767912822, "speed/FLOPS": 244241499925666.44, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04642016440629959, "optim/lr": 2.1166292138817156e-05, "optim/total_tokens": 1954830876672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.279900312423706, "created_at": "2025-06-03T06:08:39.704086+00:00"} {"global_step": 233035, "acc_step": 0, "speed/wps": 5520.683066558144, "speed/FLOPS": 243985934124338.38, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04515596851706505, "optim/lr": 2.116274491372261e-05, "optim/total_tokens": 1954839265280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2831859588623047, "created_at": "2025-06-03T06:08:42.677648+00:00"} {"global_step": 233036, "acc_step": 0, "speed/wps": 5516.3118265441135, "speed/FLOPS": 243792747689752.88, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04422657564282417, "optim/lr": 2.1159197688628063e-05, "optim/total_tokens": 1954847653888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.274888515472412, "created_at": "2025-06-03T06:08:45.655235+00:00"} {"global_step": 233037, "acc_step": 0, "speed/wps": 5526.911628283781, "speed/FLOPS": 244261204671942.6, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.049931030720472336, "optim/lr": 2.1155650463533737e-05, "optim/total_tokens": 1954856042496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2824617624282837, "created_at": "2025-06-03T06:08:48.626669+00:00"} {"global_step": 233038, "acc_step": 0, "speed/wps": 5521.182627151885, "speed/FLOPS": 244008012145598.8, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04404105618596077, "optim/lr": 2.115210323843919e-05, "optim/total_tokens": 1954864431104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2816842794418335, "created_at": "2025-06-03T06:08:51.601801+00:00"} {"global_step": 233039, "acc_step": 0, "speed/wps": 5517.366553365307, "speed/FLOPS": 243839361216668.34, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05056225508451462, "optim/lr": 2.1148556013344644e-05, "optim/total_tokens": 1954872819712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.319851040840149, "created_at": "2025-06-03T06:08:54.577915+00:00"} {"global_step": 233040, "acc_step": 0, "speed/wps": 5526.393750579027, "speed/FLOPS": 244238317128130.84, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.042752642184495926, "optim/lr": 2.1145008788250098e-05, "optim/total_tokens": 1954881208320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2808630466461182, "created_at": "2025-06-03T06:08:57.549122+00:00"} {"global_step": 233041, "acc_step": 0, "speed/wps": 5525.986213608216, "speed/FLOPS": 244220306079984.28, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043768659234046936, "optim/lr": 2.114146156315577e-05, "optim/total_tokens": 1954889596928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.301208257675171, "created_at": "2025-06-03T06:09:00.517335+00:00"} {"global_step": 233042, "acc_step": 0, "speed/wps": 5514.746656360795, "speed/FLOPS": 243723575178917.44, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.92 hours", "speed/est_time_elapsed_hrs": 192.25, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.92, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044082753360271454, "optim/lr": 2.1137914338061225e-05, "optim/total_tokens": 1954897985536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3074893951416016, "created_at": "2025-06-03T06:09:03.493593+00:00"} {"global_step": 233043, "acc_step": 0, "speed/wps": 5526.096573228365, "speed/FLOPS": 244225183410323.12, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0436842255294323, "optim/lr": 2.113436711296668e-05, "optim/total_tokens": 1954906374144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.288604497909546, "created_at": "2025-06-03T06:09:06.464532+00:00"} {"global_step": 233044, "acc_step": 0, "speed/wps": 5529.1635735040845, "speed/FLOPS": 244360729124179.44, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 191.68, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04510974511504173, "optim/lr": 2.1130819887872132e-05, "optim/total_tokens": 1954914762752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2765792608261108, "created_at": "2025-06-03T06:09:09.435898+00:00"} {"global_step": 233045, "acc_step": 0, "speed/wps": 5524.332409769683, "speed/FLOPS": 244147216415256.56, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 191.91, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04269509017467499, "optim/lr": 2.112727266277781e-05, "optim/total_tokens": 1954923151360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2794183492660522, "created_at": "2025-06-03T06:09:12.409562+00:00"} {"global_step": 233046, "acc_step": 0, "speed/wps": 5518.510902559099, "speed/FLOPS": 243889935593723.8, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0438193753361702, "optim/lr": 2.112372543768326e-05, "optim/total_tokens": 1954931539968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2882180213928223, "created_at": "2025-06-03T06:09:15.386026+00:00"} {"global_step": 233047, "acc_step": 0, "speed/wps": 5510.450767478074, "speed/FLOPS": 243533718878653.78, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04426182806491852, "optim/lr": 2.1120178212588713e-05, "optim/total_tokens": 1954939928576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2886079549789429, "created_at": "2025-06-03T06:09:18.362996+00:00"} {"global_step": 233048, "acc_step": 0, "speed/wps": 5520.182869284657, "speed/FLOPS": 243963827965091.97, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04474005103111267, "optim/lr": 2.1116630987494167e-05, "optim/total_tokens": 1954948317184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.30601167678833, "created_at": "2025-06-03T06:09:21.334484+00:00"} {"global_step": 233049, "acc_step": 0, "speed/wps": 5543.181017415397, "speed/FLOPS": 244980228397277.44, "speed/curr_iter_time": 2.9545, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9545, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 191.26, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04882757365703583, "optim/lr": 2.1113083762399844e-05, "optim/total_tokens": 1954956705792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.3035500049591064, "created_at": "2025-06-03T06:09:24.297242+00:00"} {"global_step": 233050, "acc_step": 0, "speed/wps": 5525.986802478565, "speed/FLOPS": 244220332105039.6, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04621119052171707, "optim/lr": 2.1109536537305298e-05, "optim/total_tokens": 1954965094400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2865285873413086, "created_at": "2025-06-03T06:09:27.265630+00:00"} {"global_step": 233051, "acc_step": 0, "speed/wps": 5512.4209901937575, "speed/FLOPS": 243620792638172.94, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.059548016637563705, "optim/lr": 2.1105989312210748e-05, "optim/total_tokens": 1954973483008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2772902250289917, "created_at": "2025-06-03T06:09:30.241855+00:00"} {"global_step": 233052, "acc_step": 0, "speed/wps": 5520.174076006335, "speed/FLOPS": 243963439347198.22, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05910704284906387, "optim/lr": 2.11024420871162e-05, "optim/total_tokens": 1954981871616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2776447534561157, "created_at": "2025-06-03T06:09:33.217201+00:00"} {"global_step": 233053, "acc_step": 0, "speed/wps": 5523.082811080319, "speed/FLOPS": 244091990549212.56, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.049650873988866806, "optim/lr": 2.109889486202188e-05, "optim/total_tokens": 1954990260224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2652671337127686, "created_at": "2025-06-03T06:09:36.189468+00:00"} {"global_step": 233054, "acc_step": 0, "speed/wps": 5520.152555413751, "speed/FLOPS": 243962488247158.38, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05153079330921173, "optim/lr": 2.1095347636927332e-05, "optim/total_tokens": 1954998648832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.289806604385376, "created_at": "2025-06-03T06:09:39.164483+00:00"} {"global_step": 233055, "acc_step": 0, "speed/wps": 5512.104482702959, "speed/FLOPS": 243606804627111.84, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.049220141023397446, "optim/lr": 2.1091800411832786e-05, "optim/total_tokens": 1955007037440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3086432218551636, "created_at": "2025-06-03T06:09:42.143165+00:00"} {"global_step": 233056, "acc_step": 0, "speed/wps": 5521.93978471228, "speed/FLOPS": 244041474634284.56, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04724029824137688, "optim/lr": 2.1088253186738236e-05, "optim/total_tokens": 1955015426048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2964433431625366, "created_at": "2025-06-03T06:09:45.113945+00:00"} {"global_step": 233057, "acc_step": 0, "speed/wps": 5528.208342465338, "speed/FLOPS": 244318512801582.53, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046112723648548126, "optim/lr": 2.1084705961643913e-05, "optim/total_tokens": 1955023814656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2868475914001465, "created_at": "2025-06-03T06:09:48.081462+00:00"} {"global_step": 233058, "acc_step": 0, "speed/wps": 5532.25767133703, "speed/FLOPS": 244497472411367.25, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 191.64, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04393061622977257, "optim/lr": 2.1081158736549367e-05, "optim/total_tokens": 1955032203264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2959696054458618, "created_at": "2025-06-03T06:09:51.050580+00:00"} {"global_step": 233059, "acc_step": 0, "speed/wps": 5522.312236544769, "speed/FLOPS": 244057935098899.28, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04482823982834816, "optim/lr": 2.107761151145482e-05, "optim/total_tokens": 1955040591872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.283972144126892, "created_at": "2025-06-03T06:09:54.025419+00:00"} {"global_step": 233060, "acc_step": 0, "speed/wps": 5534.106209864694, "speed/FLOPS": 244579168352612.12, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 191.58, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04332756996154785, "optim/lr": 2.1074064286360494e-05, "optim/total_tokens": 1955048980480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2817200422286987, "created_at": "2025-06-03T06:09:56.989250+00:00"} {"global_step": 233061, "acc_step": 0, "speed/wps": 5519.669359079431, "speed/FLOPS": 243941133442404.5, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04427511245012283, "optim/lr": 2.1070517061265948e-05, "optim/total_tokens": 1955057369088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3055064678192139, "created_at": "2025-06-03T06:09:59.961716+00:00"} {"global_step": 233062, "acc_step": 0, "speed/wps": 5525.5428806244745, "speed/FLOPS": 244200713031286.84, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.042767804116010666, "optim/lr": 2.10669698361714e-05, "optim/total_tokens": 1955065757696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2747652530670166, "created_at": "2025-06-03T06:10:02.930481+00:00"} {"global_step": 233063, "acc_step": 0, "speed/wps": 5519.9826764982545, "speed/FLOPS": 243954980468612.56, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.042360950261354446, "optim/lr": 2.1063422611076855e-05, "optim/total_tokens": 1955074146304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3163247108459473, "created_at": "2025-06-03T06:10:05.906379+00:00"} {"global_step": 233064, "acc_step": 0, "speed/wps": 5518.60142754241, "speed/FLOPS": 243893936334637.3, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04484602063894272, "optim/lr": 2.105987538598253e-05, "optim/total_tokens": 1955082534912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2859655618667603, "created_at": "2025-06-03T06:10:08.882270+00:00"} {"global_step": 233065, "acc_step": 0, "speed/wps": 5504.415638359705, "speed/FLOPS": 243266997062212.97, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.91 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.91, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04430585354566574, "optim/lr": 2.1056328160887983e-05, "optim/total_tokens": 1955090923520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3067728281021118, "created_at": "2025-06-03T06:10:11.864732+00:00"} {"global_step": 233066, "acc_step": 0, "speed/wps": 5532.2688796512375, "speed/FLOPS": 244497967761485.88, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 191.65, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04432892054319382, "optim/lr": 2.1052780935793436e-05, "optim/total_tokens": 1955099312128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2733409404754639, "created_at": "2025-06-03T06:10:14.833451+00:00"} {"global_step": 233067, "acc_step": 0, "speed/wps": 5524.173226995483, "speed/FLOPS": 244140181351408.2, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04384787380695343, "optim/lr": 2.104923371069889e-05, "optim/total_tokens": 1955107700736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2892489433288574, "created_at": "2025-06-03T06:10:17.802758+00:00"} {"global_step": 233068, "acc_step": 0, "speed/wps": 5524.525630803603, "speed/FLOPS": 244155755795960.9, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04725038632750511, "optim/lr": 2.1045686485604564e-05, "optim/total_tokens": 1955116089344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2735488414764404, "created_at": "2025-06-03T06:10:20.771579+00:00"} {"global_step": 233069, "acc_step": 0, "speed/wps": 5525.874790053609, "speed/FLOPS": 244215381729188.12, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04435281828045845, "optim/lr": 2.1042139260510017e-05, "optim/total_tokens": 1955124477952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2998181581497192, "created_at": "2025-06-03T06:10:23.743591+00:00"} {"global_step": 233070, "acc_step": 0, "speed/wps": 5525.786918797426, "speed/FLOPS": 244211498269430.7, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04987075552344322, "optim/lr": 2.103859203541547e-05, "optim/total_tokens": 1955132866560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2768304347991943, "created_at": "2025-06-03T06:10:26.712078+00:00"} {"global_step": 233071, "acc_step": 0, "speed/wps": 5511.676099132067, "speed/FLOPS": 243587872265944.28, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04417182505130768, "optim/lr": 2.1035044810320925e-05, "optim/total_tokens": 1955141255168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.288244605064392, "created_at": "2025-06-03T06:10:29.688454+00:00"} {"global_step": 233072, "acc_step": 0, "speed/wps": 5517.384566346018, "speed/FLOPS": 243840157298217.0, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04613779857754707, "optim/lr": 2.10314975852266e-05, "optim/total_tokens": 1955149643776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2815396785736084, "created_at": "2025-06-03T06:10:32.661211+00:00"} {"global_step": 233073, "acc_step": 0, "speed/wps": 5503.477775456183, "speed/FLOPS": 243225548322294.8, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04289696365594864, "optim/lr": 2.1027950360132052e-05, "optim/total_tokens": 1955158032384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2856935262680054, "created_at": "2025-06-03T06:10:35.646063+00:00"} {"global_step": 233074, "acc_step": 0, "speed/wps": 5511.978588459334, "speed/FLOPS": 243601240745928.75, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0459730438888073, "optim/lr": 2.1024403135037506e-05, "optim/total_tokens": 1955166420992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2875651121139526, "created_at": "2025-06-03T06:10:38.625707+00:00"} {"global_step": 233075, "acc_step": 0, "speed/wps": 5501.94841733009, "speed/FLOPS": 243157958521086.0, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.9 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.9, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043191730976104736, "optim/lr": 2.102085590994296e-05, "optim/total_tokens": 1955174809600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.285418152809143, "created_at": "2025-06-03T06:10:41.611540+00:00"} {"global_step": 233076, "acc_step": 0, "speed/wps": 5509.188504524479, "speed/FLOPS": 243477933316952.34, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043383680284023285, "optim/lr": 2.1017308684848636e-05, "optim/total_tokens": 1955183198208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2953625917434692, "created_at": "2025-06-03T06:10:44.590630+00:00"} {"global_step": 233077, "acc_step": 0, "speed/wps": 5523.054824401917, "speed/FLOPS": 244090753681276.03, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04290831834077835, "optim/lr": 2.1013761459754087e-05, "optim/total_tokens": 1955191586816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2824538946151733, "created_at": "2025-06-03T06:10:47.562891+00:00"} {"global_step": 233078, "acc_step": 0, "speed/wps": 5513.918300636626, "speed/FLOPS": 243686966095818.1, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04240316152572632, "optim/lr": 2.101021423465954e-05, "optim/total_tokens": 1955199975424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2934794425964355, "created_at": "2025-06-03T06:10:50.538298+00:00"} {"global_step": 233079, "acc_step": 0, "speed/wps": 5521.46488522807, "speed/FLOPS": 244020486507838.38, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04462209343910217, "optim/lr": 2.1006667009564994e-05, "optim/total_tokens": 1955208364032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2925013303756714, "created_at": "2025-06-03T06:10:53.509456+00:00"} {"global_step": 233080, "acc_step": 0, "speed/wps": 5521.258680520203, "speed/FLOPS": 244011373315202.03, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 192.04, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04330986365675926, "optim/lr": 2.100311978447067e-05, "optim/total_tokens": 1955216752640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2895257472991943, "created_at": "2025-06-03T06:10:56.484890+00:00"} {"global_step": 233081, "acc_step": 0, "speed/wps": 5504.047776711916, "speed/FLOPS": 243250739460267.3, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04549160972237587, "optim/lr": 2.0999572559376125e-05, "optim/total_tokens": 1955225141248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.277900218963623, "created_at": "2025-06-03T06:10:59.464842+00:00"} {"global_step": 233082, "acc_step": 0, "speed/wps": 5510.593048078264, "speed/FLOPS": 243540006952924.0, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05864328145980835, "optim/lr": 2.0996025334281575e-05, "optim/total_tokens": 1955233529856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.296470046043396, "created_at": "2025-06-03T06:11:02.442377+00:00"} {"global_step": 233083, "acc_step": 0, "speed/wps": 5521.672847528783, "speed/FLOPS": 244029677377082.34, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04416836425662041, "optim/lr": 2.099247810918703e-05, "optim/total_tokens": 1955241918464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.293728232383728, "created_at": "2025-06-03T06:11:05.413024+00:00"} {"global_step": 233084, "acc_step": 0, "speed/wps": 5502.077042898507, "speed/FLOPS": 243163643112844.72, "speed/curr_iter_time": 2.9754, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9754, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.042998556047677994, "optim/lr": 2.0988930884092706e-05, "optim/total_tokens": 1955250307072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2892727851867676, "created_at": "2025-06-03T06:11:08.394142+00:00"} {"global_step": 233085, "acc_step": 0, "speed/wps": 5519.960969474123, "speed/FLOPS": 243954021129252.56, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043284542858600616, "optim/lr": 2.098538365899816e-05, "optim/total_tokens": 1955258695680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2869004011154175, "created_at": "2025-06-03T06:11:11.365464+00:00"} {"global_step": 233086, "acc_step": 0, "speed/wps": 5514.946473853951, "speed/FLOPS": 243732406089356.28, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04493290185928345, "optim/lr": 2.0981836433903613e-05, "optim/total_tokens": 1955267084288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2865545749664307, "created_at": "2025-06-03T06:11:14.341005+00:00"} {"global_step": 233087, "acc_step": 0, "speed/wps": 5530.64046938297, "speed/FLOPS": 244426000362587.78, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.86 hours", "speed/est_time_elapsed_hrs": 191.72, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.86, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04275314509868622, "optim/lr": 2.0978289208809287e-05, "optim/total_tokens": 1955275472896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2991838455200195, "created_at": "2025-06-03T06:11:17.307124+00:00"} {"global_step": 233088, "acc_step": 0, "speed/wps": 5509.918102962939, "speed/FLOPS": 243510177833508.94, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04376796633005142, "optim/lr": 2.097474198371474e-05, "optim/total_tokens": 1955283861504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2919371128082275, "created_at": "2025-06-03T06:11:20.284085+00:00"} {"global_step": 233089, "acc_step": 0, "speed/wps": 5510.844053275075, "speed/FLOPS": 243551100097862.0, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.88 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.88, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046567417681217194, "optim/lr": 2.0971194758620194e-05, "optim/total_tokens": 1955292250112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2854067087173462, "created_at": "2025-06-03T06:11:23.264676+00:00"} {"global_step": 233090, "acc_step": 0, "speed/wps": 5501.381010722356, "speed/FLOPS": 243132882053274.47, "speed/curr_iter_time": 2.977, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.977, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.89 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.89, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04461552947759628, "optim/lr": 2.0967647533525648e-05, "optim/total_tokens": 1955300638720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2977179288864136, "created_at": "2025-06-03T06:11:26.248896+00:00"} {"global_step": 233091, "acc_step": 0, "speed/wps": 5518.812667083378, "speed/FLOPS": 243903272041126.1, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04290187358856201, "optim/lr": 2.096410030843132e-05, "optim/total_tokens": 1955309027328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2824265956878662, "created_at": "2025-06-03T06:11:29.225169+00:00"} {"global_step": 233092, "acc_step": 0, "speed/wps": 5531.647330427308, "speed/FLOPS": 244470498467165.5, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.86 hours", "speed/est_time_elapsed_hrs": 191.7, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.86, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04335624724626541, "optim/lr": 2.0960553083336775e-05, "optim/total_tokens": 1955317415936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2789274454116821, "created_at": "2025-06-03T06:11:32.194463+00:00"} {"global_step": 233093, "acc_step": 0, "speed/wps": 5519.37116762421, "speed/FLOPS": 243927954906365.97, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.12, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04332135245203972, "optim/lr": 2.095700585824223e-05, "optim/total_tokens": 1955325804544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2923388481140137, "created_at": "2025-06-03T06:11:35.171776+00:00"} {"global_step": 233094, "acc_step": 0, "speed/wps": 5522.278408935017, "speed/FLOPS": 244056440091693.66, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.86 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.86, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04320196434855461, "optim/lr": 2.0953458633147682e-05, "optim/total_tokens": 1955334193152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2872304916381836, "created_at": "2025-06-03T06:11:38.143479+00:00"} {"global_step": 233095, "acc_step": 0, "speed/wps": 5533.559213141253, "speed/FLOPS": 244554993897219.06, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 191.63, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04480113834142685, "optim/lr": 2.0949911408053356e-05, "optim/total_tokens": 1955342581760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.291691780090332, "created_at": "2025-06-03T06:11:41.108056+00:00"} {"global_step": 233096, "acc_step": 0, "speed/wps": 5517.01504713774, "speed/FLOPS": 243823826440581.88, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04445934295654297, "optim/lr": 2.094636418295881e-05, "optim/total_tokens": 1955350970368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2965940237045288, "created_at": "2025-06-03T06:11:44.081011+00:00"} {"global_step": 233097, "acc_step": 0, "speed/wps": 5518.052813414234, "speed/FLOPS": 243869690398233.6, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04269815608859062, "optim/lr": 2.0942816957864263e-05, "optim/total_tokens": 1955359358976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2958728075027466, "created_at": "2025-06-03T06:11:47.057584+00:00"} {"global_step": 233098, "acc_step": 0, "speed/wps": 5506.306095991816, "speed/FLOPS": 243350545613312.94, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04345545545220375, "optim/lr": 2.0939269732769717e-05, "optim/total_tokens": 1955367747584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2910195589065552, "created_at": "2025-06-03T06:11:50.036392+00:00"} {"global_step": 233099, "acc_step": 0, "speed/wps": 5516.355017757142, "speed/FLOPS": 243794656520296.1, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04489228501915932, "optim/lr": 2.093572250767539e-05, "optim/total_tokens": 1955376136192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2831602096557617, "created_at": "2025-06-03T06:11:53.010484+00:00"} {"global_step": 233100, "acc_step": 0, "speed/wps": 5514.079825917564, "speed/FLOPS": 243694104686474.25, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.87 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.87, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045428402721881866, "optim/lr": 2.0932175282580844e-05, "optim/total_tokens": 1955384524800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.28996741771698, "created_at": "2025-06-03T06:11:55.992481+00:00"} {"global_step": 233101, "acc_step": 0, "speed/wps": 258.7461939970963, "speed/FLOPS": 11435257391592.547, "speed/curr_iter_time": 2.8813, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.8813, "speed/est_time_elapsed": "7.77 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 186.56, "speed/est_time_elapsed_days": 7.77, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04349131137132645, "optim/lr": 2.0928628057486298e-05, "optim/total_tokens": 1955392913408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2986736297607422, "created_at": "2025-06-03T06:12:59.320010+00:00"} {"global_step": 233102, "acc_step": 0, "speed/wps": 5596.029246352721, "speed/FLOPS": 247315849614549.88, "speed/curr_iter_time": 2.9262, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9262, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 189.47, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0449027493596077, "optim/lr": 2.092508083239175e-05, "optim/total_tokens": 1955401302016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2874419689178467, "created_at": "2025-06-03T06:13:02.253150+00:00"} {"global_step": 233103, "acc_step": 0, "speed/wps": 5557.058781558318, "speed/FLOPS": 245593554539558.34, "speed/curr_iter_time": 2.9471, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9471, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 190.83, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045718587934970856, "optim/lr": 2.092153360729743e-05, "optim/total_tokens": 1955409690624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2928048372268677, "created_at": "2025-06-03T06:13:05.205486+00:00"} {"global_step": 233104, "acc_step": 0, "speed/wps": 5554.898668482633, "speed/FLOPS": 245498088598074.12, "speed/curr_iter_time": 2.9473, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9473, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 190.84, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04568924754858017, "optim/lr": 2.091798638220288e-05, "optim/total_tokens": 1955418079232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2866063117980957, "created_at": "2025-06-03T06:13:08.162784+00:00"} {"global_step": 233105, "acc_step": 0, "speed/wps": 5528.508062059725, "speed/FLOPS": 244331758873550.47, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04338490217924118, "optim/lr": 2.0914439157108333e-05, "optim/total_tokens": 1955426467840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.292150855064392, "created_at": "2025-06-03T06:13:11.130143+00:00"} {"global_step": 233106, "acc_step": 0, "speed/wps": 5541.624379165041, "speed/FLOPS": 244911432954208.56, "speed/curr_iter_time": 2.9553, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9553, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.36, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05620993673801422, "optim/lr": 2.0910891932013786e-05, "optim/total_tokens": 1955434856448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.311784029006958, "created_at": "2025-06-03T06:13:14.094613+00:00"} {"global_step": 233107, "acc_step": 0, "speed/wps": 5536.329740307125, "speed/FLOPS": 244677437017107.03, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.54, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043092623353004456, "optim/lr": 2.0907344706919463e-05, "optim/total_tokens": 1955443245056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2781014442443848, "created_at": "2025-06-03T06:13:17.061457+00:00"} {"global_step": 233108, "acc_step": 0, "speed/wps": 5528.238526857044, "speed/FLOPS": 244319846797198.22, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04400932788848877, "optim/lr": 2.0903797481824917e-05, "optim/total_tokens": 1955451633664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.3012444972991943, "created_at": "2025-06-03T06:13:20.033094+00:00"} {"global_step": 233109, "acc_step": 0, "speed/wps": 5530.065121047441, "speed/FLOPS": 244400572911057.16, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04464789107441902, "optim/lr": 2.0900250256730367e-05, "optim/total_tokens": 1955460022272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2806473970413208, "created_at": "2025-06-03T06:13:23.003258+00:00"} {"global_step": 233110, "acc_step": 0, "speed/wps": 5516.832423031088, "speed/FLOPS": 243815755389822.78, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.86 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.86, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045323796570301056, "optim/lr": 2.089670303163582e-05, "optim/total_tokens": 1955468410880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.304127812385559, "created_at": "2025-06-03T06:13:25.977050+00:00"} {"global_step": 233111, "acc_step": 0, "speed/wps": 5517.817379587025, "speed/FLOPS": 243859285428130.53, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05273295193910599, "optim/lr": 2.0893155806541498e-05, "optim/total_tokens": 1955476799488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2875938415527344, "created_at": "2025-06-03T06:13:28.954134+00:00"} {"global_step": 233112, "acc_step": 0, "speed/wps": 5521.883953096888, "speed/FLOPS": 244039007162656.34, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04337690398097038, "optim/lr": 2.0889608581446952e-05, "optim/total_tokens": 1955485188096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2832772731781006, "created_at": "2025-06-03T06:13:31.925931+00:00"} {"global_step": 233113, "acc_step": 0, "speed/wps": 5540.369022637106, "speed/FLOPS": 244855952621171.03, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045137740671634674, "optim/lr": 2.0886061356352405e-05, "optim/total_tokens": 1955493576704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2879892587661743, "created_at": "2025-06-03T06:13:34.888131+00:00"} {"global_step": 233114, "acc_step": 0, "speed/wps": 5537.443620217402, "speed/FLOPS": 244726664807787.06, "speed/curr_iter_time": 2.9575, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9575, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.51, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043325621634721756, "optim/lr": 2.088251413125808e-05, "optim/total_tokens": 1955501965312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2775965929031372, "created_at": "2025-06-03T06:13:37.850422+00:00"} {"global_step": 233115, "acc_step": 0, "speed/wps": 5533.527310577787, "speed/FLOPS": 244553583967205.97, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.59, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.048351485282182693, "optim/lr": 2.0878966906163533e-05, "optim/total_tokens": 1955510353920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2927097082138062, "created_at": "2025-06-03T06:13:40.814780+00:00"} {"global_step": 233116, "acc_step": 0, "speed/wps": 5529.36798727219, "speed/FLOPS": 244369763166445.2, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.79, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04493643343448639, "optim/lr": 2.0875419681068986e-05, "optim/total_tokens": 1955518742528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2700961828231812, "created_at": "2025-06-03T06:13:43.786129+00:00"} {"global_step": 233117, "acc_step": 0, "speed/wps": 5527.247495325023, "speed/FLOPS": 244276048276042.1, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04424607381224632, "optim/lr": 2.087187245597444e-05, "optim/total_tokens": 1955527131136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2729637622833252, "created_at": "2025-06-03T06:13:46.756946+00:00"} {"global_step": 233118, "acc_step": 0, "speed/wps": 5526.152452742099, "speed/FLOPS": 244227652998812.9, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.84, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045150794088840485, "optim/lr": 2.0868325230880114e-05, "optim/total_tokens": 1955535519744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2780742645263672, "created_at": "2025-06-03T06:13:49.729855+00:00"} {"global_step": 233119, "acc_step": 0, "speed/wps": 5518.174072565909, "speed/FLOPS": 243875049432077.03, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044582124799489975, "optim/lr": 2.0864778005785567e-05, "optim/total_tokens": 1955543908352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3051837682724, "created_at": "2025-06-03T06:13:52.702488+00:00"} {"global_step": 233120, "acc_step": 0, "speed/wps": 5520.260130174142, "speed/FLOPS": 243967242500950.16, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.049049634486436844, "optim/lr": 2.086123078069102e-05, "optim/total_tokens": 1955552296960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2657655477523804, "created_at": "2025-06-03T06:13:55.677294+00:00"} {"global_step": 233121, "acc_step": 0, "speed/wps": 5519.724381732988, "speed/FLOPS": 243943565162060.25, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043711140751838684, "optim/lr": 2.0857683555596475e-05, "optim/total_tokens": 1955560685568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2905973196029663, "created_at": "2025-06-03T06:13:58.653121+00:00"} {"global_step": 233122, "acc_step": 0, "speed/wps": 5529.212558093697, "speed/FLOPS": 244362893992314.47, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044108796864748, "optim/lr": 2.085413633050215e-05, "optim/total_tokens": 1955569074176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2971258163452148, "created_at": "2025-06-03T06:14:01.624716+00:00"} {"global_step": 233123, "acc_step": 0, "speed/wps": 5528.684034798525, "speed/FLOPS": 244339535967895.3, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04590250551700592, "optim/lr": 2.0850589105407602e-05, "optim/total_tokens": 1955577462784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2914773225784302, "created_at": "2025-06-03T06:14:04.594726+00:00"} {"global_step": 233124, "acc_step": 0, "speed/wps": 5524.826918764544, "speed/FLOPS": 244169071181702.9, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04694635793566704, "optim/lr": 2.0847041880313056e-05, "optim/total_tokens": 1955585851392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.286926031112671, "created_at": "2025-06-03T06:14:07.567754+00:00"} {"global_step": 233125, "acc_step": 0, "speed/wps": 5527.164191352228, "speed/FLOPS": 244272366666832.97, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04420619085431099, "optim/lr": 2.084349465521851e-05, "optim/total_tokens": 1955594240000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2951757907867432, "created_at": "2025-06-03T06:14:10.537447+00:00"} {"global_step": 233126, "acc_step": 0, "speed/wps": 5520.662477523627, "speed/FLOPS": 243985024194396.94, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05094024911522865, "optim/lr": 2.0839947430124183e-05, "optim/total_tokens": 1955602628608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2836554050445557, "created_at": "2025-06-03T06:14:13.512023+00:00"} {"global_step": 233127, "acc_step": 0, "speed/wps": 5527.789280308773, "speed/FLOPS": 244299992399216.94, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04343527927994728, "optim/lr": 2.0836400205029637e-05, "optim/total_tokens": 1955611017216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.298277735710144, "created_at": "2025-06-03T06:14:16.479868+00:00"} {"global_step": 233128, "acc_step": 0, "speed/wps": 5516.689390594153, "speed/FLOPS": 243809434088216.62, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04434901475906372, "optim/lr": 2.083285297993509e-05, "optim/total_tokens": 1955619405824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2791235446929932, "created_at": "2025-06-03T06:14:19.456106+00:00"} {"global_step": 233129, "acc_step": 0, "speed/wps": 5530.978279624395, "speed/FLOPS": 244440929846189.22, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04587661102414131, "optim/lr": 2.0829305754840544e-05, "optim/total_tokens": 1955627794432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.282964825630188, "created_at": "2025-06-03T06:14:22.422090+00:00"} {"global_step": 233130, "acc_step": 0, "speed/wps": 5527.057308915645, "speed/FLOPS": 244267643010209.9, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 191.89, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04519645497202873, "optim/lr": 2.0825758529746218e-05, "optim/total_tokens": 1955636183040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3120790719985962, "created_at": "2025-06-03T06:14:25.392743+00:00"} {"global_step": 233131, "acc_step": 0, "speed/wps": 5520.7701509893795, "speed/FLOPS": 243989782810460.47, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04470700025558472, "optim/lr": 2.082221130465167e-05, "optim/total_tokens": 1955644571648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2772108316421509, "created_at": "2025-06-03T06:14:28.367401+00:00"} {"global_step": 233132, "acc_step": 0, "speed/wps": 5514.796530285026, "speed/FLOPS": 243725779351090.56, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04656941443681717, "optim/lr": 2.0818664079557125e-05, "optim/total_tokens": 1955652960256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2697618007659912, "created_at": "2025-06-03T06:14:31.342272+00:00"} {"global_step": 233133, "acc_step": 0, "speed/wps": 5529.260391351193, "speed/FLOPS": 244365007977462.97, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 191.81, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043377988040447235, "optim/lr": 2.081511685446258e-05, "optim/total_tokens": 1955661348864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.283369779586792, "created_at": "2025-06-03T06:14:34.313188+00:00"} {"global_step": 233134, "acc_step": 0, "speed/wps": 5516.5527894722, "speed/FLOPS": 243803397017814.22, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04822174459695816, "optim/lr": 2.0811569629368256e-05, "optim/total_tokens": 1955669737472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2891254425048828, "created_at": "2025-06-03T06:14:37.286567+00:00"} {"global_step": 233135, "acc_step": 0, "speed/wps": 5514.950329673011, "speed/FLOPS": 243732576496822.88, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.25, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044356003403663635, "optim/lr": 2.0808022404273706e-05, "optim/total_tokens": 1955678126080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2826184034347534, "created_at": "2025-06-03T06:14:40.263010+00:00"} {"global_step": 233136, "acc_step": 0, "speed/wps": 5514.167043937645, "speed/FLOPS": 243697959276539.53, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0440831184387207, "optim/lr": 2.080447517917916e-05, "optim/total_tokens": 1955686514688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2916845083236694, "created_at": "2025-06-03T06:14:43.241564+00:00"} {"global_step": 233137, "acc_step": 0, "speed/wps": 5502.5792587894275, "speed/FLOPS": 243185838484649.44, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05033193156123161, "optim/lr": 2.0800927954084613e-05, "optim/total_tokens": 1955694903296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2830796241760254, "created_at": "2025-06-03T06:14:46.223817+00:00"} {"global_step": 233138, "acc_step": 0, "speed/wps": 5519.75317376817, "speed/FLOPS": 243944837622644.3, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04465841129422188, "optim/lr": 2.079738072899029e-05, "optim/total_tokens": 1955703291904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2915674448013306, "created_at": "2025-06-03T06:14:49.197529+00:00"} {"global_step": 233139, "acc_step": 0, "speed/wps": 5526.844664227678, "speed/FLOPS": 244258245203415.9, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04371943324804306, "optim/lr": 2.0793833503895744e-05, "optim/total_tokens": 1955711680512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2743806838989258, "created_at": "2025-06-03T06:14:52.170415+00:00"} {"global_step": 233140, "acc_step": 0, "speed/wps": 5504.651505488575, "speed/FLOPS": 243277421182031.62, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04323691129684448, "optim/lr": 2.0790286278801194e-05, "optim/total_tokens": 1955720069120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.276249885559082, "created_at": "2025-06-03T06:14:55.154558+00:00"} {"global_step": 233141, "acc_step": 0, "speed/wps": 5515.617284657367, "speed/FLOPS": 243762052493346.34, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045328326523303986, "optim/lr": 2.078673905370687e-05, "optim/total_tokens": 1955728457728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2711397409439087, "created_at": "2025-06-03T06:14:58.131303+00:00"} {"global_step": 233142, "acc_step": 0, "speed/wps": 5513.357171687353, "speed/FLOPS": 243662167068378.6, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043036963790655136, "optim/lr": 2.0783191828612325e-05, "optim/total_tokens": 1955736846336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2955663204193115, "created_at": "2025-06-03T06:15:01.108669+00:00"} {"global_step": 233143, "acc_step": 0, "speed/wps": 5523.668307516704, "speed/FLOPS": 244117866494858.34, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.01, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04323171451687813, "optim/lr": 2.077964460351778e-05, "optim/total_tokens": 1955745234944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2927806377410889, "created_at": "2025-06-03T06:15:04.081760+00:00"} {"global_step": 233144, "acc_step": 0, "speed/wps": 5509.5559402996205, "speed/FLOPS": 243494172097506.8, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.84 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.84, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04408881813287735, "optim/lr": 2.0776097378423232e-05, "optim/total_tokens": 1955753623552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2738817930221558, "created_at": "2025-06-03T06:15:07.062304+00:00"} {"global_step": 233145, "acc_step": 0, "speed/wps": 5512.912059811568, "speed/FLOPS": 243642495401758.0, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04369185119867325, "optim/lr": 2.0772550153328906e-05, "optim/total_tokens": 1955762012160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2754051685333252, "created_at": "2025-06-03T06:15:10.042079+00:00"} {"global_step": 233146, "acc_step": 0, "speed/wps": 5510.546679078424, "speed/FLOPS": 243537957680469.16, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04402949661016464, "optim/lr": 2.076900292823436e-05, "optim/total_tokens": 1955770400768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2864606380462646, "created_at": "2025-06-03T06:15:13.019062+00:00"} {"global_step": 233147, "acc_step": 0, "speed/wps": 5522.506636433041, "speed/FLOPS": 244066526578932.1, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04265887662768364, "optim/lr": 2.0765455703139813e-05, "optim/total_tokens": 1955778789376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3001196384429932, "created_at": "2025-06-03T06:15:15.993338+00:00"} {"global_step": 233148, "acc_step": 0, "speed/wps": 5517.288725005085, "speed/FLOPS": 243835921601508.22, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04309093579649925, "optim/lr": 2.0761908478045267e-05, "optim/total_tokens": 1955787177984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2790454626083374, "created_at": "2025-06-03T06:15:18.969527+00:00"} {"global_step": 233149, "acc_step": 0, "speed/wps": 5516.8805769223, "speed/FLOPS": 243817883545340.38, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04329608008265495, "optim/lr": 2.075836125295094e-05, "optim/total_tokens": 1955795566592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2876756191253662, "created_at": "2025-06-03T06:15:21.947682+00:00"} {"global_step": 233150, "acc_step": 0, "speed/wps": 5515.3058125851385, "speed/FLOPS": 243748287022012.4, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043907951563596725, "optim/lr": 2.0754814027856394e-05, "optim/total_tokens": 1955803955200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2811630964279175, "created_at": "2025-06-03T06:15:24.921647+00:00"} {"global_step": 233151, "acc_step": 0, "speed/wps": 5514.542527043194, "speed/FLOPS": 243714553707908.03, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044120125472545624, "optim/lr": 2.0751266802761848e-05, "optim/total_tokens": 1955812343808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2950619459152222, "created_at": "2025-06-03T06:15:27.899635+00:00"} {"global_step": 233152, "acc_step": 0, "speed/wps": 5512.983587122583, "speed/FLOPS": 243645656542794.9, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0432937927544117, "optim/lr": 2.07477195776673e-05, "optim/total_tokens": 1955820732416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.284228801727295, "created_at": "2025-06-03T06:15:30.874952+00:00"} {"global_step": 233153, "acc_step": 0, "speed/wps": 5513.763012559672, "speed/FLOPS": 243680103157653.16, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.047174397855997086, "optim/lr": 2.0744172352572975e-05, "optim/total_tokens": 1955829121024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2746931314468384, "created_at": "2025-06-03T06:15:33.850099+00:00"} {"global_step": 233154, "acc_step": 0, "speed/wps": 5525.995901561201, "speed/FLOPS": 244220734237918.8, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04432643949985504, "optim/lr": 2.074062512747843e-05, "optim/total_tokens": 1955837509632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3064817190170288, "created_at": "2025-06-03T06:15:36.821609+00:00"} {"global_step": 233155, "acc_step": 0, "speed/wps": 5530.167187922479, "speed/FLOPS": 244405083744508.2, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 191.74, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04473990574479103, "optim/lr": 2.0737077902383883e-05, "optim/total_tokens": 1955845898240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2854499816894531, "created_at": "2025-06-03T06:15:39.792055+00:00"} {"global_step": 233156, "acc_step": 0, "speed/wps": 5522.381117750714, "speed/FLOPS": 244060979295636.06, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04323528707027435, "optim/lr": 2.0733530677289336e-05, "optim/total_tokens": 1955854286848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2797000408172607, "created_at": "2025-06-03T06:15:42.762954+00:00"} {"global_step": 233157, "acc_step": 0, "speed/wps": 5524.900797824313, "speed/FLOPS": 244172336257997.38, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04326838254928589, "optim/lr": 2.072998345219501e-05, "optim/total_tokens": 1955862675456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3023934364318848, "created_at": "2025-06-03T06:15:45.735270+00:00"} {"global_step": 233158, "acc_step": 0, "speed/wps": 5516.252119143187, "speed/FLOPS": 243790108928242.1, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04292254522442818, "optim/lr": 2.0726436227100464e-05, "optim/total_tokens": 1955871064064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2907637357711792, "created_at": "2025-06-03T06:15:48.711277+00:00"} {"global_step": 233159, "acc_step": 0, "speed/wps": 5515.998130974343, "speed/FLOPS": 243778883951208.53, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043454669415950775, "optim/lr": 2.0722889002005917e-05, "optim/total_tokens": 1955879452672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2883442640304565, "created_at": "2025-06-03T06:15:51.687112+00:00"} {"global_step": 233160, "acc_step": 0, "speed/wps": 5504.3294673749215, "speed/FLOPS": 243263188745748.62, "speed/curr_iter_time": 2.9754, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9754, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.83 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.83, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04906455799937248, "optim/lr": 2.071934177691137e-05, "optim/total_tokens": 1955887841280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.290972113609314, "created_at": "2025-06-03T06:15:54.666894+00:00"} {"global_step": 233161, "acc_step": 0, "speed/wps": 5509.991404351153, "speed/FLOPS": 243513417379677.47, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0434410534799099, "optim/lr": 2.0715794551817048e-05, "optim/total_tokens": 1955896229888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2700108289718628, "created_at": "2025-06-03T06:15:57.644221+00:00"} {"global_step": 233162, "acc_step": 0, "speed/wps": 5504.532669039471, "speed/FLOPS": 243272169219241.34, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04306081682443619, "optim/lr": 2.07122473267225e-05, "optim/total_tokens": 1955904618496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2799428701400757, "created_at": "2025-06-03T06:16:00.626661+00:00"} {"global_step": 233163, "acc_step": 0, "speed/wps": 5522.258787403795, "speed/FLOPS": 244055572920445.75, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04511795565485954, "optim/lr": 2.0708700101627952e-05, "optim/total_tokens": 1955913007104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.276323914527893, "created_at": "2025-06-03T06:16:03.598740+00:00"} {"global_step": 233164, "acc_step": 0, "speed/wps": 5526.398203567386, "speed/FLOPS": 244238513927423.84, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04320913180708885, "optim/lr": 2.0705152876533406e-05, "optim/total_tokens": 1955921395712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2929917573928833, "created_at": "2025-06-03T06:16:06.568929+00:00"} {"global_step": 233165, "acc_step": 0, "speed/wps": 5519.366731580796, "speed/FLOPS": 243927758855952.78, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.12, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043286509811878204, "optim/lr": 2.0701605651439083e-05, "optim/total_tokens": 1955929784320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2923309803009033, "created_at": "2025-06-03T06:16:09.541704+00:00"} {"global_step": 233166, "acc_step": 0, "speed/wps": 5517.907679323355, "speed/FLOPS": 243863276214280.38, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04380622133612633, "optim/lr": 2.0698058426344536e-05, "optim/total_tokens": 1955938172928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2769441604614258, "created_at": "2025-06-03T06:16:12.516790+00:00"} {"global_step": 233167, "acc_step": 0, "speed/wps": 5511.575446244191, "speed/FLOPS": 243583423923488.34, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.048474688082933426, "optim/lr": 2.0694511201249987e-05, "optim/total_tokens": 1955946561536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2893368005752563, "created_at": "2025-06-03T06:16:15.493321+00:00"} {"global_step": 233168, "acc_step": 0, "speed/wps": 5513.8531023069345, "speed/FLOPS": 243684084663361.06, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04295668751001358, "optim/lr": 2.0690963976155664e-05, "optim/total_tokens": 1955954950144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.293070673942566, "created_at": "2025-06-03T06:16:18.471904+00:00"} {"global_step": 233169, "acc_step": 0, "speed/wps": 5505.100874567635, "speed/FLOPS": 243297280995246.66, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.049225736409425735, "optim/lr": 2.0687416751061117e-05, "optim/total_tokens": 1955963338752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2848695516586304, "created_at": "2025-06-03T06:16:21.451568+00:00"} {"global_step": 233170, "acc_step": 0, "speed/wps": 5506.695021494937, "speed/FLOPS": 243367734129849.7, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.82 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.82, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04719657450914383, "optim/lr": 2.068386952596657e-05, "optim/total_tokens": 1955971727360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2916038036346436, "created_at": "2025-06-03T06:16:24.434160+00:00"} {"global_step": 233171, "acc_step": 0, "speed/wps": 5522.229460891629, "speed/FLOPS": 244054276838714.7, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045708417892456055, "optim/lr": 2.0680322300872025e-05, "optim/total_tokens": 1955980115968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2956972122192383, "created_at": "2025-06-03T06:16:27.403899+00:00"} {"global_step": 233172, "acc_step": 0, "speed/wps": 5516.989690762422, "speed/FLOPS": 243822705818578.5, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05121684446930885, "optim/lr": 2.06767750757777e-05, "optim/total_tokens": 1955988504576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2794976234436035, "created_at": "2025-06-03T06:16:30.379843+00:00"} {"global_step": 233173, "acc_step": 0, "speed/wps": 5520.325591841907, "speed/FLOPS": 243970135571602.2, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045735426247119904, "optim/lr": 2.0673227850683152e-05, "optim/total_tokens": 1955996893184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2858939170837402, "created_at": "2025-06-03T06:16:33.351242+00:00"} {"global_step": 233174, "acc_step": 0, "speed/wps": 5522.132824108506, "speed/FLOPS": 244050005987532.53, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.06049072742462158, "optim/lr": 2.0669680625588606e-05, "optim/total_tokens": 1956005281792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2806109189987183, "created_at": "2025-06-03T06:16:36.322747+00:00"} {"global_step": 233175, "acc_step": 0, "speed/wps": 5511.903339708933, "speed/FLOPS": 243597915136319.06, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04371771216392517, "optim/lr": 2.066613340049406e-05, "optim/total_tokens": 1956013670400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.281375527381897, "created_at": "2025-06-03T06:16:39.302346+00:00"} {"global_step": 233176, "acc_step": 0, "speed/wps": 5507.506549759312, "speed/FLOPS": 243403599525356.9, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05320354923605919, "optim/lr": 2.0662586175399733e-05, "optim/total_tokens": 1956022059008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2830811738967896, "created_at": "2025-06-03T06:16:42.285713+00:00"} {"global_step": 233177, "acc_step": 0, "speed/wps": 5517.855805538463, "speed/FLOPS": 243860983658502.22, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043752726167440414, "optim/lr": 2.0659038950305187e-05, "optim/total_tokens": 1956030447616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2947155237197876, "created_at": "2025-06-03T06:16:45.262421+00:00"} {"global_step": 233178, "acc_step": 0, "speed/wps": 5502.583417034318, "speed/FLOPS": 243186022257789.75, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.050780728459358215, "optim/lr": 2.065549172521064e-05, "optim/total_tokens": 1956038836224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2972975969314575, "created_at": "2025-06-03T06:16:48.248754+00:00"} {"global_step": 233179, "acc_step": 0, "speed/wps": 5500.957145919481, "speed/FLOPS": 243114149398524.12, "speed/curr_iter_time": 2.9762, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9762, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04381107538938522, "optim/lr": 2.0651944500116094e-05, "optim/total_tokens": 1956047224832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3054957389831543, "created_at": "2025-06-03T06:16:51.230402+00:00"} {"global_step": 233180, "acc_step": 0, "speed/wps": 5501.481646448518, "speed/FLOPS": 243137329637270.5, "speed/curr_iter_time": 2.9769, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9769, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05333669111132622, "optim/lr": 2.0648397275021768e-05, "optim/total_tokens": 1956055613440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2987481355667114, "created_at": "2025-06-03T06:16:54.213446+00:00"} {"global_step": 233181, "acc_step": 0, "speed/wps": 5514.51032782116, "speed/FLOPS": 243713130667104.7, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04309481754899025, "optim/lr": 2.064485004992722e-05, "optim/total_tokens": 1956064002048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2730889320373535, "created_at": "2025-06-03T06:16:57.187494+00:00"} {"global_step": 233182, "acc_step": 0, "speed/wps": 5515.7464385892135, "speed/FLOPS": 243767760436064.2, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04361570626497269, "optim/lr": 2.0641302824832675e-05, "optim/total_tokens": 1956072390656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.295105218887329, "created_at": "2025-06-03T06:17:00.161243+00:00"} {"global_step": 233183, "acc_step": 0, "speed/wps": 5506.172392878409, "speed/FLOPS": 243344636620054.9, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043109387159347534, "optim/lr": 2.063775559973813e-05, "optim/total_tokens": 1956080779264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2841928005218506, "created_at": "2025-06-03T06:17:03.139814+00:00"} {"global_step": 233184, "acc_step": 0, "speed/wps": 5501.456873944712, "speed/FLOPS": 243136234819399.44, "speed/curr_iter_time": 2.9769, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9769, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04416628181934357, "optim/lr": 2.0634208374643802e-05, "optim/total_tokens": 1956089167872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.3068174123764038, "created_at": "2025-06-03T06:17:06.122045+00:00"} {"global_step": 233185, "acc_step": 0, "speed/wps": 5510.729180287702, "speed/FLOPS": 243546023299793.38, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04252162203192711, "optim/lr": 2.0630661149549256e-05, "optim/total_tokens": 1956097556480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2810933589935303, "created_at": "2025-06-03T06:17:09.101326+00:00"} {"global_step": 233186, "acc_step": 0, "speed/wps": 5502.274490405321, "speed/FLOPS": 243172369282017.9, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.042512983083724976, "optim/lr": 2.062711392445471e-05, "optim/total_tokens": 1956105945088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3056349754333496, "created_at": "2025-06-03T06:17:12.085763+00:00"} {"global_step": 233187, "acc_step": 0, "speed/wps": 5509.3321390506135, "speed/FLOPS": 243484281227819.34, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04368881508708, "optim/lr": 2.0623566699360163e-05, "optim/total_tokens": 1956114333696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3090136051177979, "created_at": "2025-06-03T06:17:15.066706+00:00"} {"global_step": 233188, "acc_step": 0, "speed/wps": 5510.720392934617, "speed/FLOPS": 243545634943764.78, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04353395849466324, "optim/lr": 2.0620019474265837e-05, "optim/total_tokens": 1956122722304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3039848804473877, "created_at": "2025-06-03T06:17:18.046976+00:00"} {"global_step": 233189, "acc_step": 0, "speed/wps": 5511.73867987093, "speed/FLOPS": 243590638014284.78, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04354549199342728, "optim/lr": 2.061647224917129e-05, "optim/total_tokens": 1956131110912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2932114601135254, "created_at": "2025-06-03T06:17:21.026775+00:00"} {"global_step": 233190, "acc_step": 0, "speed/wps": 5510.982616985847, "speed/FLOPS": 243557223904644.78, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044094011187553406, "optim/lr": 2.0612925024076744e-05, "optim/total_tokens": 1956139499520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2826542854309082, "created_at": "2025-06-03T06:17:24.003438+00:00"} {"global_step": 233191, "acc_step": 0, "speed/wps": 5521.561353927358, "speed/FLOPS": 244024749930575.38, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.13, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04422902688384056, "optim/lr": 2.0609377798982198e-05, "optim/total_tokens": 1956147888128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2926361560821533, "created_at": "2025-06-03T06:17:26.975457+00:00"} {"global_step": 233192, "acc_step": 0, "speed/wps": 5509.4274358574985, "speed/FLOPS": 243488492858910.38, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04959912598133087, "optim/lr": 2.0605830573887875e-05, "optim/total_tokens": 1956156276736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2866183519363403, "created_at": "2025-06-03T06:17:29.952735+00:00"} {"global_step": 233193, "acc_step": 0, "speed/wps": 5504.630261634248, "speed/FLOPS": 243276482312406.28, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.8 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.8, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04332442581653595, "optim/lr": 2.0602283348793325e-05, "optim/total_tokens": 1956164665344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2731682062149048, "created_at": "2025-06-03T06:17:32.934301+00:00"} {"global_step": 233194, "acc_step": 0, "speed/wps": 5510.7760676469325, "speed/FLOPS": 243548095481080.1, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04497375711798668, "optim/lr": 2.059873612369878e-05, "optim/total_tokens": 1956173053952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2900567054748535, "created_at": "2025-06-03T06:17:35.913038+00:00"} {"global_step": 233195, "acc_step": 0, "speed/wps": 5506.506038253457, "speed/FLOPS": 243359382037880.2, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04275413602590561, "optim/lr": 2.0595188898604456e-05, "optim/total_tokens": 1956181442560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2825261354446411, "created_at": "2025-06-03T06:17:38.895096+00:00"} {"global_step": 233196, "acc_step": 0, "speed/wps": 5512.253586019539, "speed/FLOPS": 243613394230524.72, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045985423028469086, "optim/lr": 2.059164167350991e-05, "optim/total_tokens": 1956189831168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2987229824066162, "created_at": "2025-06-03T06:17:41.874656+00:00"} {"global_step": 233197, "acc_step": 0, "speed/wps": 5515.4602507864665, "speed/FLOPS": 243755112400024.75, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04290008172392845, "optim/lr": 2.0588094448415363e-05, "optim/total_tokens": 1956198219776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2947330474853516, "created_at": "2025-06-03T06:17:44.852820+00:00"} {"global_step": 233198, "acc_step": 0, "speed/wps": 5488.0272423215565, "speed/FLOPS": 242542713840741.97, "speed/curr_iter_time": 2.9842, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9842, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.81 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.81, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.047955818474292755, "optim/lr": 2.0584547223320814e-05, "optim/total_tokens": 1956206608384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2771893739700317, "created_at": "2025-06-03T06:17:47.841898+00:00"} {"global_step": 233199, "acc_step": 0, "speed/wps": 5521.993680067695, "speed/FLOPS": 244043856533132.47, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04287382960319519, "optim/lr": 2.058099999822649e-05, "optim/total_tokens": 1956214996992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2751119136810303, "created_at": "2025-06-03T06:17:50.816452+00:00"} {"global_step": 233200, "acc_step": 0, "speed/wps": 5511.511836202125, "speed/FLOPS": 243580612685214.75, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04773728549480438, "optim/lr": 2.0577452773131944e-05, "optim/total_tokens": 1956223385600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.282464861869812, "created_at": "2025-06-03T06:17:53.792561+00:00"} {"global_step": 233201, "acc_step": 0, "speed/wps": 5517.599501310568, "speed/FLOPS": 243849656323513.22, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0425226204097271, "optim/lr": 2.0573905548037398e-05, "optim/total_tokens": 1956231774208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2798434495925903, "created_at": "2025-06-03T06:17:56.765957+00:00"} {"global_step": 233202, "acc_step": 0, "speed/wps": 5513.295739486247, "speed/FLOPS": 243659452079528.2, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04616556689143181, "optim/lr": 2.057035832294285e-05, "optim/total_tokens": 1956240162816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2879247665405273, "created_at": "2025-06-03T06:17:59.745079+00:00"} {"global_step": 233203, "acc_step": 0, "speed/wps": 5504.958759002684, "speed/FLOPS": 243291000214689.2, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04293902590870857, "optim/lr": 2.0566811097848526e-05, "optim/total_tokens": 1956248551424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2720814943313599, "created_at": "2025-06-03T06:18:02.728568+00:00"} {"global_step": 233204, "acc_step": 0, "speed/wps": 5502.2202603774185, "speed/FLOPS": 243169972592359.1, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.81, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044890958815813065, "optim/lr": 2.056326387275398e-05, "optim/total_tokens": 1956256940032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2803670167922974, "created_at": "2025-06-03T06:18:05.713696+00:00"} {"global_step": 233205, "acc_step": 0, "speed/wps": 5512.634449462956, "speed/FLOPS": 243630226445287.9, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043111417442560196, "optim/lr": 2.0559716647659433e-05, "optim/total_tokens": 1956265328640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.3120938539505005, "created_at": "2025-06-03T06:18:08.690512+00:00"} {"global_step": 233206, "acc_step": 0, "speed/wps": 5514.085142693205, "speed/FLOPS": 243694339660743.84, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04776134714484215, "optim/lr": 2.0556169422564886e-05, "optim/total_tokens": 1956273717248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.281515121459961, "created_at": "2025-06-03T06:18:11.668951+00:00"} {"global_step": 233207, "acc_step": 0, "speed/wps": 5512.448637748097, "speed/FLOPS": 243622014518561.72, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043595507740974426, "optim/lr": 2.055262219747056e-05, "optim/total_tokens": 1956282105856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2937442064285278, "created_at": "2025-06-03T06:18:14.648461+00:00"} {"global_step": 233208, "acc_step": 0, "speed/wps": 5513.052092408607, "speed/FLOPS": 243648684125795.3, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.049228060990571976, "optim/lr": 2.0549074972376014e-05, "optim/total_tokens": 1956290494464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2919949293136597, "created_at": "2025-06-03T06:18:17.623830+00:00"} {"global_step": 233209, "acc_step": 0, "speed/wps": 5523.151753994363, "speed/FLOPS": 244095037473131.5, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04866567254066467, "optim/lr": 2.0545527747281467e-05, "optim/total_tokens": 1956298883072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2686491012573242, "created_at": "2025-06-03T06:18:20.597498+00:00"} {"global_step": 233210, "acc_step": 0, "speed/wps": 5505.49035174236, "speed/FLOPS": 243314493892844.56, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046272289007902145, "optim/lr": 2.054198052218692e-05, "optim/total_tokens": 1956307271680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2759745121002197, "created_at": "2025-06-03T06:18:23.576320+00:00"} {"global_step": 233211, "acc_step": 0, "speed/wps": 5517.862057253542, "speed/FLOPS": 243861259952309.53, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04737408086657524, "optim/lr": 2.0538433297092595e-05, "optim/total_tokens": 1956315660288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2845814228057861, "created_at": "2025-06-03T06:18:26.549781+00:00"} {"global_step": 233212, "acc_step": 0, "speed/wps": 5510.8735218163, "speed/FLOPS": 243552402456550.5, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04966692999005318, "optim/lr": 2.053488607199805e-05, "optim/total_tokens": 1956324048896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.278212070465088, "created_at": "2025-06-03T06:18:29.530702+00:00"} {"global_step": 233213, "acc_step": 0, "speed/wps": 5498.175561659236, "speed/FLOPS": 242991217611660.22, "speed/curr_iter_time": 2.9775, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9775, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.79 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.79, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04951023310422897, "optim/lr": 2.0531338846903502e-05, "optim/total_tokens": 1956332437504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2804149389266968, "created_at": "2025-06-03T06:18:32.517850+00:00"} {"global_step": 233214, "acc_step": 0, "speed/wps": 5525.30125621241, "speed/FLOPS": 244190034469019.47, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046504907310009, "optim/lr": 2.0527791621808956e-05, "optim/total_tokens": 1956340826112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2814946174621582, "created_at": "2025-06-03T06:18:35.486846+00:00"} {"global_step": 233215, "acc_step": 0, "speed/wps": 5519.989336164864, "speed/FLOPS": 243955274791789.44, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04866941273212433, "optim/lr": 2.052424439671463e-05, "optim/total_tokens": 1956349214720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2958664894104004, "created_at": "2025-06-03T06:18:38.458501+00:00"} {"global_step": 233216, "acc_step": 0, "speed/wps": 5509.442334841092, "speed/FLOPS": 243489151317725.3, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04500376433134079, "optim/lr": 2.0520697171620083e-05, "optim/total_tokens": 1956357603328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2918224334716797, "created_at": "2025-06-03T06:18:41.440128+00:00"} {"global_step": 233217, "acc_step": 0, "speed/wps": 5510.616837026155, "speed/FLOPS": 243541058302657.94, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04495168477296829, "optim/lr": 2.0517149946525537e-05, "optim/total_tokens": 1956365991936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2829227447509766, "created_at": "2025-06-03T06:18:44.420091+00:00"} {"global_step": 233218, "acc_step": 0, "speed/wps": 5512.092471247097, "speed/FLOPS": 243606273782242.94, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0464114211499691, "optim/lr": 2.051360272143099e-05, "optim/total_tokens": 1956374380544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2821173667907715, "created_at": "2025-06-03T06:18:47.400173+00:00"} {"global_step": 233219, "acc_step": 0, "speed/wps": 5506.425845371129, "speed/FLOPS": 243355837922945.72, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04780741035938263, "optim/lr": 2.0510055496336668e-05, "optim/total_tokens": 1956382769152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.288272500038147, "created_at": "2025-06-03T06:18:50.381713+00:00"} {"global_step": 233220, "acc_step": 0, "speed/wps": 5509.786585916812, "speed/FLOPS": 243504365453235.4, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04484567791223526, "optim/lr": 2.0506508271242118e-05, "optim/total_tokens": 1956391157760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2626352310180664, "created_at": "2025-06-03T06:18:53.359127+00:00"} {"global_step": 233221, "acc_step": 0, "speed/wps": 5495.191630311288, "speed/FLOPS": 242859343119226.06, "speed/curr_iter_time": 2.9793, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9793, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.78 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.78, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04456290975213051, "optim/lr": 2.050296104614757e-05, "optim/total_tokens": 1956399546368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2831101417541504, "created_at": "2025-06-03T06:18:56.344286+00:00"} {"global_step": 233222, "acc_step": 0, "speed/wps": 5515.062133049499, "speed/FLOPS": 243737517633802.06, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043855588883161545, "optim/lr": 2.0499413821053025e-05, "optim/total_tokens": 1956407934976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2687320709228516, "created_at": "2025-06-03T06:18:59.321133+00:00"} {"global_step": 233223, "acc_step": 0, "speed/wps": 5520.03557539204, "speed/FLOPS": 243957318328956.8, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043601203709840775, "optim/lr": 2.0495866595958702e-05, "optim/total_tokens": 1956416323584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2874782085418701, "created_at": "2025-06-03T06:19:02.293352+00:00"} {"global_step": 233224, "acc_step": 0, "speed/wps": 5508.048574983898, "speed/FLOPS": 243427554265947.0, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045728787779808044, "optim/lr": 2.0492319370864156e-05, "optim/total_tokens": 1956424712192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.3014030456542969, "created_at": "2025-06-03T06:19:05.273783+00:00"} {"global_step": 233225, "acc_step": 0, "speed/wps": 5509.478986079767, "speed/FLOPS": 243490771114876.72, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043165333569049835, "optim/lr": 2.0488772145769606e-05, "optim/total_tokens": 1956433100800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2968605756759644, "created_at": "2025-06-03T06:19:08.252506+00:00"} {"global_step": 233226, "acc_step": 0, "speed/wps": 5511.086635520069, "speed/FLOPS": 243561820991442.25, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046886131167411804, "optim/lr": 2.0485224920675283e-05, "optim/total_tokens": 1956441489408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2887752056121826, "created_at": "2025-06-03T06:19:11.233595+00:00"} {"global_step": 233227, "acc_step": 0, "speed/wps": 5498.4210005032755, "speed/FLOPS": 243002064752296.84, "speed/curr_iter_time": 2.9774, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9774, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.042979080229997635, "optim/lr": 2.0481677695580737e-05, "optim/total_tokens": 1956449878016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.278861403465271, "created_at": "2025-06-03T06:19:14.217272+00:00"} {"global_step": 233228, "acc_step": 0, "speed/wps": 5513.076214874068, "speed/FLOPS": 243649750215298.72, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04383400082588196, "optim/lr": 2.047813047048619e-05, "optim/total_tokens": 1956458266624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.284935474395752, "created_at": "2025-06-03T06:19:17.195426+00:00"} {"global_step": 233229, "acc_step": 0, "speed/wps": 5502.485468457233, "speed/FLOPS": 243181693432028.88, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04413102567195892, "optim/lr": 2.0474583245391644e-05, "optim/total_tokens": 1956466655232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2812515497207642, "created_at": "2025-06-03T06:19:20.178695+00:00"} {"global_step": 233230, "acc_step": 0, "speed/wps": 5520.944171290833, "speed/FLOPS": 243997473617068.06, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04312998428940773, "optim/lr": 2.0471036020297318e-05, "optim/total_tokens": 1956475043840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.293712854385376, "created_at": "2025-06-03T06:19:23.149577+00:00"} {"global_step": 233231, "acc_step": 0, "speed/wps": 5525.023412699745, "speed/FLOPS": 244177755207891.66, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.048000603914260864, "optim/lr": 2.046748879520277e-05, "optim/total_tokens": 1956483432448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.289117455482483, "created_at": "2025-06-03T06:19:26.121512+00:00"} {"global_step": 233232, "acc_step": 0, "speed/wps": 5524.521286660138, "speed/FLOPS": 244155563807055.1, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04633065313100815, "optim/lr": 2.0463941570108225e-05, "optim/total_tokens": 1956491821056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2810218334197998, "created_at": "2025-06-03T06:19:29.093803+00:00"} {"global_step": 233233, "acc_step": 0, "speed/wps": 5526.058836979909, "speed/FLOPS": 244223515661293.0, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04422452673316002, "optim/lr": 2.046039434501368e-05, "optim/total_tokens": 1956500209664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2884490489959717, "created_at": "2025-06-03T06:19:32.061985+00:00"} {"global_step": 233234, "acc_step": 0, "speed/wps": 5507.870026501107, "speed/FLOPS": 243419663336901.6, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04424801468849182, "optim/lr": 2.0456847119919353e-05, "optim/total_tokens": 1956508598272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2779394388198853, "created_at": "2025-06-03T06:19:35.040167+00:00"} {"global_step": 233235, "acc_step": 0, "speed/wps": 5519.194009793832, "speed/FLOPS": 243920125437039.25, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043563611805438995, "optim/lr": 2.0453299894824806e-05, "optim/total_tokens": 1956516986880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2759679555892944, "created_at": "2025-06-03T06:19:38.012340+00:00"} {"global_step": 233236, "acc_step": 0, "speed/wps": 5493.749010663131, "speed/FLOPS": 242795586714774.28, "speed/curr_iter_time": 2.979, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.979, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.77 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.77, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043256159871816635, "optim/lr": 2.044975266973026e-05, "optim/total_tokens": 1956525375488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2843527793884277, "created_at": "2025-06-03T06:19:40.998510+00:00"} {"global_step": 233237, "acc_step": 0, "speed/wps": 5511.313106207652, "speed/FLOPS": 243571829836651.34, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04288576915860176, "optim/lr": 2.0446205444635713e-05, "optim/total_tokens": 1956533764096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2853657007217407, "created_at": "2025-06-03T06:19:43.974706+00:00"} {"global_step": 233238, "acc_step": 0, "speed/wps": 5508.5821669934385, "speed/FLOPS": 243451136301597.2, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04583914577960968, "optim/lr": 2.0442658219541387e-05, "optim/total_tokens": 1956542152704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2907205820083618, "created_at": "2025-06-03T06:19:46.956517+00:00"} {"global_step": 233239, "acc_step": 0, "speed/wps": 5520.303333436143, "speed/FLOPS": 243969151863996.22, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046763788908720016, "optim/lr": 2.043911099444684e-05, "optim/total_tokens": 1956550541312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2711254358291626, "created_at": "2025-06-03T06:19:49.932639+00:00"} {"global_step": 233240, "acc_step": 0, "speed/wps": 5528.320085124167, "speed/FLOPS": 244323451255152.0, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04638697952032089, "optim/lr": 2.0435563769352294e-05, "optim/total_tokens": 1956558929920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2815114259719849, "created_at": "2025-06-03T06:19:52.901448+00:00"} {"global_step": 233241, "acc_step": 0, "speed/wps": 5519.26959020848, "speed/FLOPS": 243923465704511.03, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 192.2, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05067868530750275, "optim/lr": 2.0432016544257748e-05, "optim/total_tokens": 1956567318528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2800832986831665, "created_at": "2025-06-03T06:19:55.873351+00:00"} {"global_step": 233242, "acc_step": 0, "speed/wps": 5513.776152426614, "speed/FLOPS": 243680683872516.1, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04540345072746277, "optim/lr": 2.0428469319163422e-05, "optim/total_tokens": 1956575707136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2935271263122559, "created_at": "2025-06-03T06:19:58.848505+00:00"} {"global_step": 233243, "acc_step": 0, "speed/wps": 5519.928217655893, "speed/FLOPS": 243952573666525.8, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.22, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.048309482634067535, "optim/lr": 2.0424922094068875e-05, "optim/total_tokens": 1956584095744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.300165057182312, "created_at": "2025-06-03T06:20:01.820426+00:00"} {"global_step": 233244, "acc_step": 0, "speed/wps": 5522.123405802029, "speed/FLOPS": 244049589746593.53, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04336344450712204, "optim/lr": 2.042137486897433e-05, "optim/total_tokens": 1956592484352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2821598052978516, "created_at": "2025-06-03T06:20:04.790826+00:00"} {"global_step": 233245, "acc_step": 0, "speed/wps": 5499.614598165943, "speed/FLOPS": 243054815659600.1, "speed/curr_iter_time": 2.9778, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9778, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04758952930569649, "optim/lr": 2.0417827643879783e-05, "optim/total_tokens": 1956600872960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2829550504684448, "created_at": "2025-06-03T06:20:07.773402+00:00"} {"global_step": 233246, "acc_step": 0, "speed/wps": 5497.284186876251, "speed/FLOPS": 242951823408722.0, "speed/curr_iter_time": 2.977, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.977, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.76 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.76, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04407894238829613, "optim/lr": 2.0414280418785456e-05, "optim/total_tokens": 1956609261568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2799674272537231, "created_at": "2025-06-03T06:20:10.757165+00:00"} {"global_step": 233247, "acc_step": 0, "speed/wps": 5516.546018733776, "speed/FLOPS": 243803097785831.66, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05354665592312813, "optim/lr": 2.041073319369091e-05, "optim/total_tokens": 1956617650176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2922358512878418, "created_at": "2025-06-03T06:20:13.733099+00:00"} {"global_step": 233248, "acc_step": 0, "speed/wps": 5519.792005974606, "speed/FLOPS": 243946553807407.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04395684227347374, "optim/lr": 2.0407185968596364e-05, "optim/total_tokens": 1956626038784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2907525300979614, "created_at": "2025-06-03T06:20:16.710492+00:00"} {"global_step": 233249, "acc_step": 0, "speed/wps": 5510.532055908021, "speed/FLOPS": 243537311411185.53, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.43, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04885363206267357, "optim/lr": 2.0403638743501817e-05, "optim/total_tokens": 1956634427392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.284083366394043, "created_at": "2025-06-03T06:20:19.690317+00:00"} {"global_step": 233250, "acc_step": 0, "speed/wps": 5516.13854740738, "speed/FLOPS": 243785089638832.3, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045302826911211014, "optim/lr": 2.0400091518407495e-05, "optim/total_tokens": 1956642816000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2718604803085327, "created_at": "2025-06-03T06:20:22.667469+00:00"} {"global_step": 233251, "acc_step": 0, "speed/wps": 5516.086935185641, "speed/FLOPS": 243782808642806.72, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.047048892825841904, "optim/lr": 2.0396544293312945e-05, "optim/total_tokens": 1956651204608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2812362909317017, "created_at": "2025-06-03T06:20:25.645620+00:00"} {"global_step": 233252, "acc_step": 0, "speed/wps": 5511.726896227097, "speed/FLOPS": 243590117237541.53, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04484452307224274, "optim/lr": 2.03929970682184e-05, "optim/total_tokens": 1956659593216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.283154010772705, "created_at": "2025-06-03T06:20:28.621327+00:00"} {"global_step": 233253, "acc_step": 0, "speed/wps": 5503.490263322959, "speed/FLOPS": 243226100222087.62, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044197868555784225, "optim/lr": 2.0389449843124076e-05, "optim/total_tokens": 1956667981824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2981927394866943, "created_at": "2025-06-03T06:20:31.606385+00:00"} {"global_step": 233254, "acc_step": 0, "speed/wps": 5507.94952251088, "speed/FLOPS": 243423176653636.12, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044870179146528244, "optim/lr": 2.038590261802953e-05, "optim/total_tokens": 1956676370432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2670254707336426, "created_at": "2025-06-03T06:20:34.588365+00:00"} {"global_step": 233255, "acc_step": 0, "speed/wps": 5509.680909860449, "speed/FLOPS": 243499695112443.25, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04398668557405472, "optim/lr": 2.0382355392934983e-05, "optim/total_tokens": 1956684759040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.285735011100769, "created_at": "2025-06-03T06:20:37.569714+00:00"} {"global_step": 233256, "acc_step": 0, "speed/wps": 5515.191581717652, "speed/FLOPS": 243743238602356.1, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04351797699928284, "optim/lr": 2.0378808167840436e-05, "optim/total_tokens": 1956693147648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2925269603729248, "created_at": "2025-06-03T06:20:40.545440+00:00"} {"global_step": 233257, "acc_step": 0, "speed/wps": 5525.670352442016, "speed/FLOPS": 244206346633162.28, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04348915070295334, "optim/lr": 2.037526094274611e-05, "optim/total_tokens": 1956701536256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2809892892837524, "created_at": "2025-06-03T06:20:43.513993+00:00"} {"global_step": 233258, "acc_step": 0, "speed/wps": 5521.489026781784, "speed/FLOPS": 244021553440944.88, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.13, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04479258507490158, "optim/lr": 2.0371713717651564e-05, "optim/total_tokens": 1956709924864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2908529043197632, "created_at": "2025-06-03T06:20:46.488690+00:00"} {"global_step": 233259, "acc_step": 0, "speed/wps": 5502.564479945705, "speed/FLOPS": 243185185335401.88, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043754708021879196, "optim/lr": 2.0368166492557017e-05, "optim/total_tokens": 1956718313472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2835642099380493, "created_at": "2025-06-03T06:20:49.470259+00:00"} {"global_step": 233260, "acc_step": 0, "speed/wps": 5508.494555930553, "speed/FLOPS": 243447264341051.72, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.74 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.74, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04365614429116249, "optim/lr": 2.036461926746247e-05, "optim/total_tokens": 1956726702080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2849106788635254, "created_at": "2025-06-03T06:20:52.448254+00:00"} {"global_step": 233261, "acc_step": 0, "speed/wps": 5494.502649390738, "speed/FLOPS": 242828893689061.8, "speed/curr_iter_time": 2.9805, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9805, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.75 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.75, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04359012097120285, "optim/lr": 2.0361072042368145e-05, "optim/total_tokens": 1956735090688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3042927980422974, "created_at": "2025-06-03T06:20:55.433659+00:00"} {"global_step": 233262, "acc_step": 0, "speed/wps": 5515.39374073679, "speed/FLOPS": 243752172996258.34, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04513200744986534, "optim/lr": 2.03575248172736e-05, "optim/total_tokens": 1956743479296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2956194877624512, "created_at": "2025-06-03T06:20:58.407866+00:00"} {"global_step": 233263, "acc_step": 0, "speed/wps": 5507.906149831884, "speed/FLOPS": 243421259803226.0, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04263734817504883, "optim/lr": 2.0353977592179052e-05, "optim/total_tokens": 1956751867904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.29230797290802, "created_at": "2025-06-03T06:21:01.386417+00:00"} {"global_step": 233264, "acc_step": 0, "speed/wps": 5514.7974733334795, "speed/FLOPS": 243725821029005.25, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04833992198109627, "optim/lr": 2.0350430367084506e-05, "optim/total_tokens": 1956760256512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.278467059135437, "created_at": "2025-06-03T06:21:04.364870+00:00"} {"global_step": 233265, "acc_step": 0, "speed/wps": 5525.446971274798, "speed/FLOPS": 244196474328939.7, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04338056221604347, "optim/lr": 2.034688314199018e-05, "optim/total_tokens": 1956768645120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2851976156234741, "created_at": "2025-06-03T06:21:07.339500+00:00"} {"global_step": 233266, "acc_step": 0, "speed/wps": 5513.686889056905, "speed/FLOPS": 243676738888466.28, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04459603875875473, "optim/lr": 2.0343335916895633e-05, "optim/total_tokens": 1956777033728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2775001525878906, "created_at": "2025-06-03T06:21:10.314789+00:00"} {"global_step": 233267, "acc_step": 0, "speed/wps": 5517.133749233875, "speed/FLOPS": 243829072465658.66, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04348932206630707, "optim/lr": 2.0339788691801087e-05, "optim/total_tokens": 1956785422336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2949010133743286, "created_at": "2025-06-03T06:21:13.288064+00:00"} {"global_step": 233268, "acc_step": 0, "speed/wps": 5523.890872776815, "speed/FLOPS": 244127702740162.97, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04464825615286827, "optim/lr": 2.033624146670654e-05, "optim/total_tokens": 1956793810944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.275212287902832, "created_at": "2025-06-03T06:21:16.260760+00:00"} {"global_step": 233269, "acc_step": 0, "speed/wps": 5517.460864664902, "speed/FLOPS": 243843529293381.47, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.2, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045118313282728195, "optim/lr": 2.0332694241612214e-05, "optim/total_tokens": 1956802199552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2897709608078003, "created_at": "2025-06-03T06:21:19.236936+00:00"} {"global_step": 233270, "acc_step": 0, "speed/wps": 5520.088199030219, "speed/FLOPS": 243959644024412.1, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04763660207390785, "optim/lr": 2.0329147016517668e-05, "optim/total_tokens": 1956810588160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2964977025985718, "created_at": "2025-06-03T06:21:22.208879+00:00"} {"global_step": 233271, "acc_step": 0, "speed/wps": 5506.100509258669, "speed/FLOPS": 243341459731996.16, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04541059955954552, "optim/lr": 2.032559979142312e-05, "optim/total_tokens": 1956818976768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3075203895568848, "created_at": "2025-06-03T06:21:25.188310+00:00"} {"global_step": 233272, "acc_step": 0, "speed/wps": 5506.163760506341, "speed/FLOPS": 243344255113394.0, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.051370635628700256, "optim/lr": 2.0322052566328575e-05, "optim/total_tokens": 1956827365376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2827509641647339, "created_at": "2025-06-03T06:21:28.168022+00:00"} {"global_step": 233273, "acc_step": 0, "speed/wps": 5523.044198719771, "speed/FLOPS": 244090284080512.3, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0436917282640934, "optim/lr": 2.031850534123425e-05, "optim/total_tokens": 1956835753984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.296887993812561, "created_at": "2025-06-03T06:21:31.138336+00:00"} {"global_step": 233274, "acc_step": 0, "speed/wps": 5508.604812224078, "speed/FLOPS": 243452137104882.66, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04751046374440193, "optim/lr": 2.0314958116139702e-05, "optim/total_tokens": 1956844142592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2736035585403442, "created_at": "2025-06-03T06:21:34.118823+00:00"} {"global_step": 233275, "acc_step": 0, "speed/wps": 5530.235286897993, "speed/FLOPS": 244408093370663.78, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04349320009350777, "optim/lr": 2.0311410891045156e-05, "optim/total_tokens": 1956852531200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2648770809173584, "created_at": "2025-06-03T06:21:37.087536+00:00"} {"global_step": 233276, "acc_step": 0, "speed/wps": 5514.7305539982035, "speed/FLOPS": 243722863536910.25, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04881836846470833, "optim/lr": 2.030786366595061e-05, "optim/total_tokens": 1956860919808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.261851191520691, "created_at": "2025-06-03T06:21:40.062115+00:00"} {"global_step": 233277, "acc_step": 0, "speed/wps": 5519.048525649762, "speed/FLOPS": 243913695782526.7, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04360511526465416, "optim/lr": 2.0304316440856287e-05, "optim/total_tokens": 1956869308416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2817569971084595, "created_at": "2025-06-03T06:21:43.037885+00:00"} {"global_step": 233278, "acc_step": 0, "speed/wps": 5505.080516153447, "speed/FLOPS": 243296381257543.34, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.73 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.73, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.050777532160282135, "optim/lr": 2.0300769215761737e-05, "optim/total_tokens": 1956877697024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2823140621185303, "created_at": "2025-06-03T06:21:46.018179+00:00"} {"global_step": 233279, "acc_step": 0, "speed/wps": 5510.690945882384, "speed/FLOPS": 243544333534779.75, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04312625899910927, "optim/lr": 2.029722199066719e-05, "optim/total_tokens": 1956886085632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2946410179138184, "created_at": "2025-06-03T06:21:48.998897+00:00"} {"global_step": 233280, "acc_step": 0, "speed/wps": 5510.91169401731, "speed/FLOPS": 243554089472452.1, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046912502497434616, "optim/lr": 2.0293674765572868e-05, "optim/total_tokens": 1956894474240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2714741230010986, "created_at": "2025-06-03T06:21:51.976014+00:00"} {"global_step": 233281, "acc_step": 0, "speed/wps": 5526.060222185386, "speed/FLOPS": 244223576880284.97, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04398558288812637, "optim/lr": 2.029012754047832e-05, "optim/total_tokens": 1956902862848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2725505828857422, "created_at": "2025-06-03T06:21:54.951152+00:00"} {"global_step": 233282, "acc_step": 0, "speed/wps": 5517.629621879772, "speed/FLOPS": 243850987498500.97, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04923611134290695, "optim/lr": 2.0286580315383775e-05, "optim/total_tokens": 1956911251456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2952265739440918, "created_at": "2025-06-03T06:21:57.924673+00:00"} {"global_step": 233283, "acc_step": 0, "speed/wps": 5517.944698132583, "speed/FLOPS": 243864912256168.78, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045549176633358, "optim/lr": 2.0283033090289225e-05, "optim/total_tokens": 1956919640064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2759162187576294, "created_at": "2025-06-03T06:22:00.898306+00:00"} {"global_step": 233284, "acc_step": 0, "speed/wps": 5515.275604127106, "speed/FLOPS": 243746951962788.28, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05994663015007973, "optim/lr": 2.0279485865194903e-05, "optim/total_tokens": 1956928028672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.3058406114578247, "created_at": "2025-06-03T06:22:03.872508+00:00"} {"global_step": 233285, "acc_step": 0, "speed/wps": 5526.847330378652, "speed/FLOPS": 244258363033642.38, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04498278722167015, "optim/lr": 2.0275938640100356e-05, "optim/total_tokens": 1956936417280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2768553495407104, "created_at": "2025-06-03T06:22:06.841715+00:00"} {"global_step": 233286, "acc_step": 0, "speed/wps": 5514.761629075194, "speed/FLOPS": 243724236896256.56, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05094388872385025, "optim/lr": 2.027239141500581e-05, "optim/total_tokens": 1956944805888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.299132227897644, "created_at": "2025-06-03T06:22:09.816262+00:00"} {"global_step": 233287, "acc_step": 0, "speed/wps": 5509.2863882304955, "speed/FLOPS": 243482259275744.06, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044384658336639404, "optim/lr": 2.0268844189911263e-05, "optim/total_tokens": 1956953194496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.274983286857605, "created_at": "2025-06-03T06:22:12.794432+00:00"} {"global_step": 233288, "acc_step": 0, "speed/wps": 5525.921805315217, "speed/FLOPS": 244217459563105.28, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05509193241596222, "optim/lr": 2.0265296964816937e-05, "optim/total_tokens": 1956961583104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2835097312927246, "created_at": "2025-06-03T06:22:15.763130+00:00"} {"global_step": 233289, "acc_step": 0, "speed/wps": 5506.661437085797, "speed/FLOPS": 243366249870866.3, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043206844478845596, "optim/lr": 2.026174973972239e-05, "optim/total_tokens": 1956969971712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2923609018325806, "created_at": "2025-06-03T06:22:18.741921+00:00"} {"global_step": 233290, "acc_step": 0, "speed/wps": 5510.425703126661, "speed/FLOPS": 243532611162612.28, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05205091834068298, "optim/lr": 2.0258202514627844e-05, "optim/total_tokens": 1956978360320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2907875776290894, "created_at": "2025-06-03T06:22:21.720913+00:00"} {"global_step": 233291, "acc_step": 0, "speed/wps": 5522.230300743967, "speed/FLOPS": 244054313955889.28, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.13, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04390212148427963, "optim/lr": 2.0254655289533298e-05, "optim/total_tokens": 1956986748928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2902227640151978, "created_at": "2025-06-03T06:22:24.691622+00:00"} {"global_step": 233292, "acc_step": 0, "speed/wps": 5516.426404374608, "speed/FLOPS": 243797811443398.22, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05169474333524704, "optim/lr": 2.0251108064438972e-05, "optim/total_tokens": 1956995137536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2898459434509277, "created_at": "2025-06-03T06:22:27.664921+00:00"} {"global_step": 233293, "acc_step": 0, "speed/wps": 5519.322775438423, "speed/FLOPS": 243925816219447.84, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044323600828647614, "optim/lr": 2.0247560839344425e-05, "optim/total_tokens": 1957003526144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.278899908065796, "created_at": "2025-06-03T06:22:30.642441+00:00"} {"global_step": 233294, "acc_step": 0, "speed/wps": 5507.278975903992, "speed/FLOPS": 243393541925780.34, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.71 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.71, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043659526854753494, "optim/lr": 2.024401361424988e-05, "optim/total_tokens": 1957011914752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2989411354064941, "created_at": "2025-06-03T06:22:33.621931+00:00"} {"global_step": 233295, "acc_step": 0, "speed/wps": 5494.062607217375, "speed/FLOPS": 242809446077339.22, "speed/curr_iter_time": 2.9799, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9799, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0453118272125721, "optim/lr": 2.0240466389155333e-05, "optim/total_tokens": 1957020303360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2869678735733032, "created_at": "2025-06-03T06:22:36.611453+00:00"} {"global_step": 233296, "acc_step": 0, "speed/wps": 5497.185168609273, "speed/FLOPS": 242947447308143.0, "speed/curr_iter_time": 2.9773, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9773, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.72 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.72, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04281800240278244, "optim/lr": 2.0236919164061007e-05, "optim/total_tokens": 1957028691968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2717514038085938, "created_at": "2025-06-03T06:22:39.599469+00:00"} {"global_step": 233297, "acc_step": 0, "speed/wps": 5528.637035071334, "speed/FLOPS": 244337458820519.88, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.051094282418489456, "optim/lr": 2.023337193896646e-05, "optim/total_tokens": 1957037080576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2781660556793213, "created_at": "2025-06-03T06:22:42.570548+00:00"} {"global_step": 233298, "acc_step": 0, "speed/wps": 5522.440086351366, "speed/FLOPS": 244063585405956.22, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.042916662991046906, "optim/lr": 2.0229824713871914e-05, "optim/total_tokens": 1957045469184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2938954830169678, "created_at": "2025-06-03T06:22:45.546080+00:00"} {"global_step": 233299, "acc_step": 0, "speed/wps": 5515.546134703095, "speed/FLOPS": 243758908029545.97, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.055323027074337006, "optim/lr": 2.0226277488777367e-05, "optim/total_tokens": 1957053857792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3008606433868408, "created_at": "2025-06-03T06:22:48.520914+00:00"} {"global_step": 233300, "acc_step": 0, "speed/wps": 5514.761842144369, "speed/FLOPS": 243724246312823.53, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04429718852043152, "optim/lr": 2.022273026368304e-05, "optim/total_tokens": 1957062246400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2880361080169678, "created_at": "2025-06-03T06:22:51.495108+00:00"} {"global_step": 233301, "acc_step": 0, "speed/wps": 5517.073827228157, "speed/FLOPS": 243826424219714.53, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05504675209522247, "optim/lr": 2.0219183038588495e-05, "optim/total_tokens": 1957070635008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.3007962703704834, "created_at": "2025-06-03T06:22:54.468903+00:00"} {"global_step": 233302, "acc_step": 0, "speed/wps": 5523.391501791859, "speed/FLOPS": 244105633098640.34, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044864241033792496, "optim/lr": 2.021563581349395e-05, "optim/total_tokens": 1957079023616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2857351303100586, "created_at": "2025-06-03T06:22:57.438444+00:00"} {"global_step": 233303, "acc_step": 0, "speed/wps": 5509.660736703405, "speed/FLOPS": 243498803562157.47, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.050189271569252014, "optim/lr": 2.0212088588399402e-05, "optim/total_tokens": 1957087412224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2861478328704834, "created_at": "2025-06-03T06:23:00.415615+00:00"} {"global_step": 233304, "acc_step": 0, "speed/wps": 5511.690633830946, "speed/FLOPS": 243588514625239.44, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.7 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.7, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04401196166872978, "optim/lr": 2.0208541363305076e-05, "optim/total_tokens": 1957095800832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2712222337722778, "created_at": "2025-06-03T06:23:03.391744+00:00"} {"global_step": 233305, "acc_step": 0, "speed/wps": 5516.914836271583, "speed/FLOPS": 243819397633223.47, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.048509903252124786, "optim/lr": 2.020499413821053e-05, "optim/total_tokens": 1957104189440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2915982007980347, "created_at": "2025-06-03T06:23:06.367993+00:00"} {"global_step": 233306, "acc_step": 0, "speed/wps": 5538.565234086056, "speed/FLOPS": 244776234399841.34, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 191.52, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.053154077380895615, "optim/lr": 2.0201446913115983e-05, "optim/total_tokens": 1957112578048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.287754774093628, "created_at": "2025-06-03T06:23:09.329882+00:00"} {"global_step": 233307, "acc_step": 0, "speed/wps": 5524.126450940139, "speed/FLOPS": 244138114089183.56, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046738140285015106, "optim/lr": 2.019789968802166e-05, "optim/total_tokens": 1957120966656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2962933778762817, "created_at": "2025-06-03T06:23:12.299410+00:00"} {"global_step": 233308, "acc_step": 0, "speed/wps": 5520.894258880147, "speed/FLOPS": 243995267743990.62, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05670108273625374, "optim/lr": 2.0194352462927114e-05, "optim/total_tokens": 1957129355264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2663555145263672, "created_at": "2025-06-03T06:23:15.270442+00:00"} {"global_step": 233309, "acc_step": 0, "speed/wps": 5527.753572663991, "speed/FLOPS": 244298414304085.84, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.045956533402204514, "optim/lr": 2.0190805237832564e-05, "optim/total_tokens": 1957137743872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2987232208251953, "created_at": "2025-06-03T06:23:18.242003+00:00"} {"global_step": 233310, "acc_step": 0, "speed/wps": 5525.929844933017, "speed/FLOPS": 244217814873061.53, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 191.95, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.050832346081733704, "optim/lr": 2.0187258012738018e-05, "optim/total_tokens": 1957146132480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2814456224441528, "created_at": "2025-06-03T06:23:21.212793+00:00"} {"global_step": 233311, "acc_step": 0, "speed/wps": 5526.3881921659095, "speed/FLOPS": 244238071474721.56, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04302855581045151, "optim/lr": 2.0183710787643695e-05, "optim/total_tokens": 1957154521088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2719141244888306, "created_at": "2025-06-03T06:23:24.184343+00:00"} {"global_step": 233312, "acc_step": 0, "speed/wps": 5515.952671917438, "speed/FLOPS": 243776874893573.84, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05117795616388321, "optim/lr": 2.018016356254915e-05, "optim/total_tokens": 1957162909696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.290327548980713, "created_at": "2025-06-03T06:23:27.158097+00:00"} {"global_step": 233313, "acc_step": 0, "speed/wps": 5513.039188796803, "speed/FLOPS": 243648113852200.22, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04352103918790817, "optim/lr": 2.0176616337454602e-05, "optim/total_tokens": 1957171298304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.3044276237487793, "created_at": "2025-06-03T06:23:30.136527+00:00"} {"global_step": 233314, "acc_step": 0, "speed/wps": 5517.241858693732, "speed/FLOPS": 243833850350429.94, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0460839606821537, "optim/lr": 2.0173069112360056e-05, "optim/total_tokens": 1957179686912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2907077074050903, "created_at": "2025-06-03T06:23:33.113886+00:00"} {"global_step": 233315, "acc_step": 0, "speed/wps": 5519.469933884349, "speed/FLOPS": 243932319869532.56, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.25, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04641242325305939, "optim/lr": 2.016952188726573e-05, "optim/total_tokens": 1957188075520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.281516194343567, "created_at": "2025-06-03T06:23:36.086458+00:00"} {"global_step": 233316, "acc_step": 0, "speed/wps": 5521.977112435568, "speed/FLOPS": 244043124328593.3, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04420017823576927, "optim/lr": 2.0165974662171183e-05, "optim/total_tokens": 1957196464128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2912638187408447, "created_at": "2025-06-03T06:23:39.062265+00:00"} {"global_step": 233317, "acc_step": 0, "speed/wps": 5525.503480653394, "speed/FLOPS": 244198971754232.4, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.03, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05088222399353981, "optim/lr": 2.0162427437076637e-05, "optim/total_tokens": 1957204852736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2838770151138306, "created_at": "2025-06-03T06:23:42.030913+00:00"} {"global_step": 233318, "acc_step": 0, "speed/wps": 5528.83605725325, "speed/FLOPS": 244346254582272.72, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04264754056930542, "optim/lr": 2.015888021198209e-05, "optim/total_tokens": 1957213241344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2967506647109985, "created_at": "2025-06-03T06:23:44.997542+00:00"} {"global_step": 233319, "acc_step": 0, "speed/wps": 5520.842820110463, "speed/FLOPS": 243992994413658.1, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05404997989535332, "optim/lr": 2.0155332986887764e-05, "optim/total_tokens": 1957221629952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2952449321746826, "created_at": "2025-06-03T06:23:47.968749+00:00"} {"global_step": 233320, "acc_step": 0, "speed/wps": 5513.59605607393, "speed/FLOPS": 243672724535544.16, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0432475320994854, "optim/lr": 2.0151785761793218e-05, "optim/total_tokens": 1957230018560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2832022905349731, "created_at": "2025-06-03T06:23:50.943602+00:00"} {"global_step": 233321, "acc_step": 0, "speed/wps": 5508.5257565386555, "speed/FLOPS": 243448643248230.66, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04816916212439537, "optim/lr": 2.014823853669867e-05, "optim/total_tokens": 1957238407168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2937428951263428, "created_at": "2025-06-03T06:23:53.922395+00:00"} {"global_step": 233322, "acc_step": 0, "speed/wps": 5506.067029898566, "speed/FLOPS": 243339980115642.5, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04793785512447357, "optim/lr": 2.0144691311604125e-05, "optim/total_tokens": 1957246795776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.287741780281067, "created_at": "2025-06-03T06:23:56.902130+00:00"} {"global_step": 233323, "acc_step": 0, "speed/wps": 5511.630397872369, "speed/FLOPS": 243585852504185.9, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.05372188985347748, "optim/lr": 2.01411440865098e-05, "optim/total_tokens": 1957255184384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2811815738677979, "created_at": "2025-06-03T06:23:59.880713+00:00"} {"global_step": 233324, "acc_step": 0, "speed/wps": 5515.160880879607, "speed/FLOPS": 243741881782455.66, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04336341470479965, "optim/lr": 2.0137596861415252e-05, "optim/total_tokens": 1957263572992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2789191007614136, "created_at": "2025-06-03T06:24:02.854541+00:00"} {"global_step": 233325, "acc_step": 0, "speed/wps": 5522.56890989022, "speed/FLOPS": 244069278746994.94, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045749060809612274, "optim/lr": 2.0134049636320706e-05, "optim/total_tokens": 1957271961600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2990931272506714, "created_at": "2025-06-03T06:24:05.826636+00:00"} {"global_step": 233326, "acc_step": 0, "speed/wps": 5519.708276266542, "speed/FLOPS": 243942853382878.6, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.042842913419008255, "optim/lr": 2.013050241122616e-05, "optim/total_tokens": 1957280350208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2840989828109741, "created_at": "2025-06-03T06:24:08.804085+00:00"} {"global_step": 233327, "acc_step": 0, "speed/wps": 5504.650081475618, "speed/FLOPS": 243277358247947.7, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.69 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.69, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04342417046427727, "optim/lr": 2.0126955186131834e-05, "optim/total_tokens": 1957288738816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.280572533607483, "created_at": "2025-06-03T06:24:11.784733+00:00"} {"global_step": 233328, "acc_step": 0, "speed/wps": 5510.937802489762, "speed/FLOPS": 243555243333299.22, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.046227216720581055, "optim/lr": 2.0123407961037287e-05, "optim/total_tokens": 1957297127424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2791919708251953, "created_at": "2025-06-03T06:24:14.760823+00:00"} {"global_step": 233329, "acc_step": 0, "speed/wps": 5509.318114981331, "speed/FLOPS": 243483661435738.75, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.0432598777115345, "optim/lr": 2.011986073594274e-05, "optim/total_tokens": 1957305516032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2788383960723877, "created_at": "2025-06-03T06:24:17.742320+00:00"} {"global_step": 233330, "acc_step": 0, "speed/wps": 5504.990060394793, "speed/FLOPS": 243292383576005.34, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.044198695570230484, "optim/lr": 2.0116313510848194e-05, "optim/total_tokens": 1957313904640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.294740915298462, "created_at": "2025-06-03T06:24:20.722069+00:00"} {"global_step": 233331, "acc_step": 0, "speed/wps": 5509.410006219471, "speed/FLOPS": 243487722558122.56, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.043680548667907715, "optim/lr": 2.0112766285753868e-05, "optim/total_tokens": 1957322293248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2925798892974854, "created_at": "2025-06-03T06:24:23.704029+00:00"} {"global_step": 233332, "acc_step": 0, "speed/wps": 5517.65481540715, "speed/FLOPS": 243852100923458.94, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044760722666978836, "optim/lr": 2.0109219060659322e-05, "optim/total_tokens": 1957330681856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2852662801742554, "created_at": "2025-06-03T06:24:26.677106+00:00"} {"global_step": 233333, "acc_step": 0, "speed/wps": 5528.533718578473, "speed/FLOPS": 244332892760357.16, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.66 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.66, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04314470663666725, "optim/lr": 2.0105671835564775e-05, "optim/total_tokens": 1957339070464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.277411937713623, "created_at": "2025-06-03T06:24:29.643615+00:00"} {"global_step": 233334, "acc_step": 0, "speed/wps": 5512.978662053407, "speed/FLOPS": 243645438879946.1, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04461236670613289, "optim/lr": 2.0102124610470453e-05, "optim/total_tokens": 1957347459072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2986164093017578, "created_at": "2025-06-03T06:24:32.618775+00:00"} {"global_step": 233335, "acc_step": 0, "speed/wps": 5525.127743738709, "speed/FLOPS": 244182366105799.22, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.66 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.66, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043877746909856796, "optim/lr": 2.0098577385375906e-05, "optim/total_tokens": 1957355847680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2757920026779175, "created_at": "2025-06-03T06:24:35.587157+00:00"} {"global_step": 233336, "acc_step": 0, "speed/wps": 5506.205307384307, "speed/FLOPS": 243346091272743.9, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.68 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.68, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043656207621097565, "optim/lr": 2.0095030160281356e-05, "optim/total_tokens": 1957364236288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.300387978553772, "created_at": "2025-06-03T06:24:38.569376+00:00"} {"global_step": 233337, "acc_step": 0, "speed/wps": 5506.79940226112, "speed/FLOPS": 243372347225445.8, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043732888996601105, "optim/lr": 2.009148293518681e-05, "optim/total_tokens": 1957372624896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2933396100997925, "created_at": "2025-06-03T06:24:41.551344+00:00"} {"global_step": 233338, "acc_step": 0, "speed/wps": 5511.765630693542, "speed/FLOPS": 243591829102697.44, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04305582493543625, "optim/lr": 2.0087935710092487e-05, "optim/total_tokens": 1957381013504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2961781024932861, "created_at": "2025-06-03T06:24:44.528531+00:00"} {"global_step": 233339, "acc_step": 0, "speed/wps": 5524.1744542688475, "speed/FLOPS": 244140235590609.16, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.66 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.66, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04453935846686363, "optim/lr": 2.008438848499794e-05, "optim/total_tokens": 1957389402112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.283238172531128, "created_at": "2025-06-03T06:24:47.498264+00:00"} {"global_step": 233340, "acc_step": 0, "speed/wps": 5509.0511791227655, "speed/FLOPS": 243471864237091.75, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04303146153688431, "optim/lr": 2.0080841259903394e-05, "optim/total_tokens": 1957397790720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2774693965911865, "created_at": "2025-06-03T06:24:50.475810+00:00"} {"global_step": 233341, "acc_step": 0, "speed/wps": 5516.926367020663, "speed/FLOPS": 243819907233313.06, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04500178247690201, "optim/lr": 2.0077294034808845e-05, "optim/total_tokens": 1957406179328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2925573587417603, "created_at": "2025-06-03T06:24:53.452165+00:00"} {"global_step": 233342, "acc_step": 0, "speed/wps": 5508.13967755297, "speed/FLOPS": 243431580533194.75, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04363394156098366, "optim/lr": 2.0073746809714522e-05, "optim/total_tokens": 1957414567936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.28457510471344, "created_at": "2025-06-03T06:24:56.432405+00:00"} {"global_step": 233343, "acc_step": 0, "speed/wps": 5523.27435324166, "speed/FLOPS": 244100455732342.2, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.66 hours", "speed/est_time_elapsed_hrs": 192.05, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.66, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04464254155755043, "optim/lr": 2.0070199584619975e-05, "optim/total_tokens": 1957422956544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.274962067604065, "created_at": "2025-06-03T06:24:59.406129+00:00"} {"global_step": 233344, "acc_step": 0, "speed/wps": 5525.524577003402, "speed/FLOPS": 244199904104921.84, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.66 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.66, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04283391311764717, "optim/lr": 2.006665235952543e-05, "optim/total_tokens": 1957431345152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2907979488372803, "created_at": "2025-06-03T06:25:02.378774+00:00"} {"global_step": 233345, "acc_step": 0, "speed/wps": 5515.899085525283, "speed/FLOPS": 243774506649320.62, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.66 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.66, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046509675681591034, "optim/lr": 2.0063105134430883e-05, "optim/total_tokens": 1957439733760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2954392433166504, "created_at": "2025-06-03T06:25:05.352442+00:00"} {"global_step": 233346, "acc_step": 0, "speed/wps": 5518.819437327343, "speed/FLOPS": 243903571251256.1, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.66 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.66, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04347081482410431, "optim/lr": 2.0059557909336557e-05, "optim/total_tokens": 1957448122368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2886474132537842, "created_at": "2025-06-03T06:25:08.325460+00:00"} {"global_step": 233347, "acc_step": 0, "speed/wps": 5503.8175097077965, "speed/FLOPS": 243240562837298.6, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.67 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.67, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04281778261065483, "optim/lr": 2.005601068424201e-05, "optim/total_tokens": 1957456510976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2867437601089478, "created_at": "2025-06-03T06:25:11.310262+00:00"} {"global_step": 233348, "acc_step": 0, "speed/wps": 5535.878990970257, "speed/FLOPS": 244657516203561.75, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 191.75, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04427649825811386, "optim/lr": 2.0052463459147464e-05, "optim/total_tokens": 1957464899584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2831661701202393, "created_at": "2025-06-03T06:25:14.273884+00:00"} {"global_step": 233349, "acc_step": 0, "speed/wps": 5532.493044598818, "speed/FLOPS": 244507874704788.75, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04452698305249214, "optim/lr": 2.0048916234052917e-05, "optim/total_tokens": 1957473288192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2955431938171387, "created_at": "2025-06-03T06:25:17.241934+00:00"} {"global_step": 233350, "acc_step": 0, "speed/wps": 5528.012904757636, "speed/FLOPS": 244309875455242.97, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045628730207681656, "optim/lr": 2.004536900895859e-05, "optim/total_tokens": 1957481676800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2879891395568848, "created_at": "2025-06-03T06:25:20.209247+00:00"} {"global_step": 233351, "acc_step": 0, "speed/wps": 5523.178402111282, "speed/FLOPS": 244096215183501.88, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.2, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04444832354784012, "optim/lr": 2.0041821783864045e-05, "optim/total_tokens": 1957490065408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.290765404701233, "created_at": "2025-06-03T06:25:23.179419+00:00"} {"global_step": 233352, "acc_step": 0, "speed/wps": 5525.432153075233, "speed/FLOPS": 244195819440365.34, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.12, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04419387876987457, "optim/lr": 2.00382745587695e-05, "optim/total_tokens": 1957498454016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2906829118728638, "created_at": "2025-06-03T06:25:26.147906+00:00"} {"global_step": 233353, "acc_step": 0, "speed/wps": 5529.126465268391, "speed/FLOPS": 244359089130098.97, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 191.92, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04584381356835365, "optim/lr": 2.0034727333674952e-05, "optim/total_tokens": 1957506842624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.296691656112671, "created_at": "2025-06-03T06:25:29.117699+00:00"} {"global_step": 233354, "acc_step": 0, "speed/wps": 5522.991636613531, "speed/FLOPS": 244087961104453.78, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.2, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04348954185843468, "optim/lr": 2.0031180108580626e-05, "optim/total_tokens": 1957515231232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.280449390411377, "created_at": "2025-06-03T06:25:32.087925+00:00"} {"global_step": 233355, "acc_step": 0, "speed/wps": 5520.927715645837, "speed/FLOPS": 243996746361786.88, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046679187566041946, "optim/lr": 2.002763288348608e-05, "optim/total_tokens": 1957523619840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3012491464614868, "created_at": "2025-06-03T06:25:35.062316+00:00"} {"global_step": 233356, "acc_step": 0, "speed/wps": 5514.887078238018, "speed/FLOPS": 243729781107146.38, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04521660506725311, "optim/lr": 2.0024085658391533e-05, "optim/total_tokens": 1957532008448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.29140305519104, "created_at": "2025-06-03T06:25:38.036564+00:00"} {"global_step": 233357, "acc_step": 0, "speed/wps": 5513.772934635298, "speed/FLOPS": 243680541662610.06, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043960586190223694, "optim/lr": 2.0020538433296987e-05, "optim/total_tokens": 1957540397056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2988481521606445, "created_at": "2025-06-03T06:25:41.013023+00:00"} {"global_step": 233358, "acc_step": 0, "speed/wps": 5528.825859783541, "speed/FLOPS": 244345803906306.94, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04378209263086319, "optim/lr": 2.001699120820266e-05, "optim/total_tokens": 1957548785664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2864463329315186, "created_at": "2025-06-03T06:25:43.980107+00:00"} {"global_step": 233359, "acc_step": 0, "speed/wps": 5521.369955249916, "speed/FLOPS": 244016291088699.66, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04501556232571602, "optim/lr": 2.0013443983108114e-05, "optim/total_tokens": 1957557174272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2759703397750854, "created_at": "2025-06-03T06:25:46.951221+00:00"} {"global_step": 233360, "acc_step": 0, "speed/wps": 5510.899791339435, "speed/FLOPS": 243553563435013.44, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0479414276778698, "optim/lr": 2.0009896758013568e-05, "optim/total_tokens": 1957565562880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2755273580551147, "created_at": "2025-06-03T06:25:49.930775+00:00"} {"global_step": 233361, "acc_step": 0, "speed/wps": 5518.539617018916, "speed/FLOPS": 243891204625873.8, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043534550815820694, "optim/lr": 2.0006349532919245e-05, "optim/total_tokens": 1957573951488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2799330949783325, "created_at": "2025-06-03T06:25:52.903074+00:00"} {"global_step": 233362, "acc_step": 0, "speed/wps": 5513.423415342318, "speed/FLOPS": 243665094698862.25, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04663725942373276, "optim/lr": 2.0002802307824695e-05, "optim/total_tokens": 1957582340096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2785714864730835, "created_at": "2025-06-03T06:25:55.878225+00:00"} {"global_step": 233363, "acc_step": 0, "speed/wps": 5515.56350072889, "speed/FLOPS": 243759675518998.75, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044971272349357605, "optim/lr": 1.999925508273015e-05, "optim/total_tokens": 1957590728704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2698698043823242, "created_at": "2025-06-03T06:25:58.855887+00:00"} {"global_step": 233364, "acc_step": 0, "speed/wps": 5522.3479163962265, "speed/FLOPS": 244059511965707.66, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04688262566924095, "optim/lr": 1.9995707857635602e-05, "optim/total_tokens": 1957599117312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.27322518825531, "created_at": "2025-06-03T06:26:01.826416+00:00"} {"global_step": 233365, "acc_step": 0, "speed/wps": 5530.682752469731, "speed/FLOPS": 244427869058598.2, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04555557295680046, "optim/lr": 1.999216063254128e-05, "optim/total_tokens": 1957607505920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2761740684509277, "created_at": "2025-06-03T06:26:04.792571+00:00"} {"global_step": 233366, "acc_step": 0, "speed/wps": 5524.725417605867, "speed/FLOPS": 244164585350019.4, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043489981442689896, "optim/lr": 1.9988613407446733e-05, "optim/total_tokens": 1957615894528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2964222431182861, "created_at": "2025-06-03T06:26:07.765469+00:00"} {"global_step": 233367, "acc_step": 0, "speed/wps": 5526.755207281227, "speed/FLOPS": 244254291664264.94, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04332088306546211, "optim/lr": 1.9985066182352183e-05, "optim/total_tokens": 1957624283136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2826652526855469, "created_at": "2025-06-03T06:26:10.734052+00:00"} {"global_step": 233368, "acc_step": 0, "speed/wps": 5521.5622841269005, "speed/FLOPS": 244024791040633.94, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.22, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043029990047216415, "optim/lr": 1.9981518957257637e-05, "optim/total_tokens": 1957632671744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2936127185821533, "created_at": "2025-06-03T06:26:13.704822+00:00"} {"global_step": 233369, "acc_step": 0, "speed/wps": 5512.728909568601, "speed/FLOPS": 243634401098466.78, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.65 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.65, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043422188609838486, "optim/lr": 1.9977971732163314e-05, "optim/total_tokens": 1957641060352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2746179103851318, "created_at": "2025-06-03T06:26:16.680400+00:00"} {"global_step": 233370, "acc_step": 0, "speed/wps": 5513.0011840697125, "speed/FLOPS": 243646434237788.7, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043887875974178314, "optim/lr": 1.9974424507068768e-05, "optim/total_tokens": 1957649448960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2876595258712769, "created_at": "2025-06-03T06:26:19.656390+00:00"} {"global_step": 233371, "acc_step": 0, "speed/wps": 5517.339290781143, "speed/FLOPS": 243838156349990.88, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045371029525995255, "optim/lr": 1.997087728197422e-05, "optim/total_tokens": 1957657837568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2994338274002075, "created_at": "2025-06-03T06:26:22.629704+00:00"} {"global_step": 233372, "acc_step": 0, "speed/wps": 5518.6122607561065, "speed/FLOPS": 243894415107233.28, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04308713972568512, "optim/lr": 1.9967330056879675e-05, "optim/total_tokens": 1957666226176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2838726043701172, "created_at": "2025-06-03T06:26:25.604263+00:00"} {"global_step": 233373, "acc_step": 0, "speed/wps": 5531.27430749191, "speed/FLOPS": 244454012762725.4, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 191.88, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04492659494280815, "optim/lr": 1.996378283178535e-05, "optim/total_tokens": 1957674614784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2730286121368408, "created_at": "2025-06-03T06:26:28.571112+00:00"} {"global_step": 233374, "acc_step": 0, "speed/wps": 5521.780851581252, "speed/FLOPS": 244034450603386.62, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043788693845272064, "optim/lr": 1.9960235606690802e-05, "optim/total_tokens": 1957683003392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2815897464752197, "created_at": "2025-06-03T06:26:31.541975+00:00"} {"global_step": 233375, "acc_step": 0, "speed/wps": 5534.7084484769675, "speed/FLOPS": 244605784216737.94, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 191.76, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.051139846444129944, "optim/lr": 1.9956688381596256e-05, "optim/total_tokens": 1957691392000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.287073016166687, "created_at": "2025-06-03T06:26:34.507283+00:00"} {"global_step": 233376, "acc_step": 0, "speed/wps": 5529.682927319695, "speed/FLOPS": 244383681904535.62, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04601406306028366, "optim/lr": 1.995314115650171e-05, "optim/total_tokens": 1957699780608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.282428503036499, "created_at": "2025-06-03T06:26:37.474284+00:00"} {"global_step": 233377, "acc_step": 0, "speed/wps": 5525.595638390637, "speed/FLOPS": 244203044654512.5, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.02, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04954652488231659, "optim/lr": 1.9949593931407384e-05, "optim/total_tokens": 1957708169216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.29969322681427, "created_at": "2025-06-03T06:26:40.443068+00:00"} {"global_step": 233378, "acc_step": 0, "speed/wps": 5525.101668092815, "speed/FLOPS": 244181213695717.97, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04518958553671837, "optim/lr": 1.9946046706312837e-05, "optim/total_tokens": 1957716557824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.288324236869812, "created_at": "2025-06-03T06:26:43.412604+00:00"} {"global_step": 233379, "acc_step": 0, "speed/wps": 5511.3774843315605, "speed/FLOPS": 243574675020211.0, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0481095165014267, "optim/lr": 1.994249948121829e-05, "optim/total_tokens": 1957724946432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2914561033248901, "created_at": "2025-06-03T06:26:46.394722+00:00"} {"global_step": 233380, "acc_step": 0, "speed/wps": 5506.599838149245, "speed/FLOPS": 243363527513162.7, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.64 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.64, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04480770230293274, "optim/lr": 1.9938952256123744e-05, "optim/total_tokens": 1957733335040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2986446619033813, "created_at": "2025-06-03T06:26:49.378804+00:00"} {"global_step": 233381, "acc_step": 0, "speed/wps": 5520.142102417082, "speed/FLOPS": 243962026278208.94, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04543006792664528, "optim/lr": 1.9935405031029418e-05, "optim/total_tokens": 1957741723648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2852741479873657, "created_at": "2025-06-03T06:26:52.350810+00:00"} {"global_step": 233382, "acc_step": 0, "speed/wps": 5528.02991510584, "speed/FLOPS": 244310627225566.72, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.052435971796512604, "optim/lr": 1.9931857805934872e-05, "optim/total_tokens": 1957750112256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.294154405593872, "created_at": "2025-06-03T06:26:55.322047+00:00"} {"global_step": 233383, "acc_step": 0, "speed/wps": 5521.015253960377, "speed/FLOPS": 244000615107227.8, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04538309574127197, "optim/lr": 1.9928310580840325e-05, "optim/total_tokens": 1957758500864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3080984354019165, "created_at": "2025-06-03T06:26:58.297806+00:00"} {"global_step": 233384, "acc_step": 0, "speed/wps": 5526.498722357542, "speed/FLOPS": 244242956343446.9, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04312481731176376, "optim/lr": 1.992476335574578e-05, "optim/total_tokens": 1957766889472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2763460874557495, "created_at": "2025-06-03T06:27:01.268954+00:00"} {"global_step": 233385, "acc_step": 0, "speed/wps": 5522.418371263853, "speed/FLOPS": 244062625710236.06, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0456252358853817, "optim/lr": 1.9921216130651453e-05, "optim/total_tokens": 1957775278080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.286368727684021, "created_at": "2025-06-03T06:27:04.239324+00:00"} {"global_step": 233386, "acc_step": 0, "speed/wps": 5518.576662917654, "speed/FLOPS": 243892841864979.94, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04374498873949051, "optim/lr": 1.9917668905556906e-05, "optim/total_tokens": 1957783666688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2999708652496338, "created_at": "2025-06-03T06:27:07.211475+00:00"} {"global_step": 233387, "acc_step": 0, "speed/wps": 5526.9083877630965, "speed/FLOPS": 244261061457514.8, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045162707567214966, "optim/lr": 1.991412168046236e-05, "optim/total_tokens": 1957792055296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2927418947219849, "created_at": "2025-06-03T06:27:10.180865+00:00"} {"global_step": 233388, "acc_step": 0, "speed/wps": 5514.548294152892, "speed/FLOPS": 243714808584637.94, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04454208165407181, "optim/lr": 1.9910574455368037e-05, "optim/total_tokens": 1957800443904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2911086082458496, "created_at": "2025-06-03T06:27:13.156368+00:00"} {"global_step": 233389, "acc_step": 0, "speed/wps": 5514.458590492994, "speed/FLOPS": 243710844142015.38, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045353639870882034, "optim/lr": 1.9907027230273487e-05, "optim/total_tokens": 1957808832512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2828383445739746, "created_at": "2025-06-03T06:27:16.132314+00:00"} {"global_step": 233390, "acc_step": 0, "speed/wps": 5510.459118572752, "speed/FLOPS": 243534087954293.75, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04462409019470215, "optim/lr": 1.990348000517894e-05, "optim/total_tokens": 1957817221120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2925844192504883, "created_at": "2025-06-03T06:27:19.109499+00:00"} {"global_step": 233391, "acc_step": 0, "speed/wps": 5528.497152606048, "speed/FLOPS": 244331276731537.6, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04721479490399361, "optim/lr": 1.9899932780084395e-05, "optim/total_tokens": 1957825609728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2808407545089722, "created_at": "2025-06-03T06:27:22.076428+00:00"} {"global_step": 233392, "acc_step": 0, "speed/wps": 5523.86027360804, "speed/FLOPS": 244126350413523.88, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.16, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04500105232000351, "optim/lr": 1.9896385554990072e-05, "optim/total_tokens": 1957833998336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2850310802459717, "created_at": "2025-06-03T06:27:25.049320+00:00"} {"global_step": 233393, "acc_step": 0, "speed/wps": 5525.839964578257, "speed/FLOPS": 244213842621430.53, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05286498740315437, "optim/lr": 1.9892838329895526e-05, "optim/total_tokens": 1957842386944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2725646495819092, "created_at": "2025-06-03T06:27:28.017960+00:00"} {"global_step": 233394, "acc_step": 0, "speed/wps": 5513.413955012844, "speed/FLOPS": 243664676600721.88, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04359247535467148, "optim/lr": 1.9889291104800976e-05, "optim/total_tokens": 1957850775552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2958616018295288, "created_at": "2025-06-03T06:27:30.996522+00:00"} {"global_step": 233395, "acc_step": 0, "speed/wps": 5512.653417059483, "speed/FLOPS": 243631064715969.47, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04833676293492317, "optim/lr": 1.988574387970643e-05, "optim/total_tokens": 1957859164160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2965972423553467, "created_at": "2025-06-03T06:27:33.974535+00:00"} {"global_step": 233396, "acc_step": 0, "speed/wps": 5509.167045348269, "speed/FLOPS": 243476984931201.9, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.63 hours", "speed/est_time_elapsed_hrs": 192.67, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.63, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04362925514578819, "optim/lr": 1.9882196654612107e-05, "optim/total_tokens": 1957867552768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2604811191558838, "created_at": "2025-06-03T06:27:36.952070+00:00"} {"global_step": 233397, "acc_step": 0, "speed/wps": 5508.426385064906, "speed/FLOPS": 243444251537720.22, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0473751500248909, "optim/lr": 1.987864942951756e-05, "optim/total_tokens": 1957875941376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2962907552719116, "created_at": "2025-06-03T06:27:39.931220+00:00"} {"global_step": 233398, "acc_step": 0, "speed/wps": 5524.0592638131875, "speed/FLOPS": 244135144762067.2, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.16, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043847400695085526, "optim/lr": 1.9875102204423014e-05, "optim/total_tokens": 1957884329984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.297921061515808, "created_at": "2025-06-03T06:27:42.900826+00:00"} {"global_step": 233399, "acc_step": 0, "speed/wps": 5517.128714662568, "speed/FLOPS": 243828849963376.16, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04685153812170029, "optim/lr": 1.9871554979328464e-05, "optim/total_tokens": 1957892718592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.285383701324463, "created_at": "2025-06-03T06:27:45.873705+00:00"} {"global_step": 233400, "acc_step": 0, "speed/wps": 5523.788720912615, "speed/FLOPS": 244123188150625.97, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04524970427155495, "optim/lr": 1.986800775423414e-05, "optim/total_tokens": 1957901107200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2848674058914185, "created_at": "2025-06-03T06:27:48.845021+00:00"} {"global_step": 233401, "acc_step": 0, "speed/wps": 5514.980601130318, "speed/FLOPS": 243733914340292.47, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04451962932944298, "optim/lr": 1.9864460529139595e-05, "optim/total_tokens": 1957909495808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2715349197387695, "created_at": "2025-06-03T06:27:51.822261+00:00"} {"global_step": 233402, "acc_step": 0, "speed/wps": 5519.16709406457, "speed/FLOPS": 243918935899573.03, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.047345057129859924, "optim/lr": 1.986091330404505e-05, "optim/total_tokens": 1957917884416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2896863222122192, "created_at": "2025-06-03T06:27:54.794000+00:00"} {"global_step": 233403, "acc_step": 0, "speed/wps": 5513.203694394578, "speed/FLOPS": 243655384157605.9, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046122580766677856, "optim/lr": 1.9857366078950502e-05, "optim/total_tokens": 1957926273024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2805805206298828, "created_at": "2025-06-03T06:27:57.769175+00:00"} {"global_step": 233404, "acc_step": 0, "speed/wps": 5515.918695613116, "speed/FLOPS": 243775373314829.3, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04299626499414444, "optim/lr": 1.9853818853856176e-05, "optim/total_tokens": 1957934661632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2892694473266602, "created_at": "2025-06-03T06:28:00.746476+00:00"} {"global_step": 233405, "acc_step": 0, "speed/wps": 5516.405768804833, "speed/FLOPS": 243796899456836.62, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043463923037052155, "optim/lr": 1.985027162876163e-05, "optim/total_tokens": 1957943050240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.298785924911499, "created_at": "2025-06-03T06:28:03.721928+00:00"} {"global_step": 233406, "acc_step": 0, "speed/wps": 5515.925586740479, "speed/FLOPS": 243775677867386.75, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04418123513460159, "optim/lr": 1.9846724403667083e-05, "optim/total_tokens": 1957951438848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2840168476104736, "created_at": "2025-06-03T06:28:06.699418+00:00"} {"global_step": 233407, "acc_step": 0, "speed/wps": 5519.35376808892, "speed/FLOPS": 243927185935965.06, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04395219311118126, "optim/lr": 1.9843177178572537e-05, "optim/total_tokens": 1957959827456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2885441780090332, "created_at": "2025-06-03T06:28:09.673118+00:00"} {"global_step": 233408, "acc_step": 0, "speed/wps": 5517.567312670896, "speed/FLOPS": 243848233750396.12, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0437757782638073, "optim/lr": 1.983962995347821e-05, "optim/total_tokens": 1957968216064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2821424007415771, "created_at": "2025-06-03T06:28:12.648546+00:00"} {"global_step": 233409, "acc_step": 0, "speed/wps": 5513.496657534179, "speed/FLOPS": 243668331628855.0, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04341159388422966, "optim/lr": 1.9836082728383664e-05, "optim/total_tokens": 1957976604672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2897870540618896, "created_at": "2025-06-03T06:28:15.623809+00:00"} {"global_step": 233410, "acc_step": 0, "speed/wps": 5508.520126638849, "speed/FLOPS": 243448394435475.66, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04333384335041046, "optim/lr": 1.9832535503289118e-05, "optim/total_tokens": 1957984993280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2880340814590454, "created_at": "2025-06-03T06:28:18.601650+00:00"} {"global_step": 233411, "acc_step": 0, "speed/wps": 5514.026876058189, "speed/FLOPS": 243691764573711.84, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043292075395584106, "optim/lr": 1.982898827819457e-05, "optim/total_tokens": 1957993381888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.284556269645691, "created_at": "2025-06-03T06:28:21.576985+00:00"} {"global_step": 233412, "acc_step": 0, "speed/wps": 5515.32016801906, "speed/FLOPS": 243748921458713.97, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04289190471172333, "optim/lr": 1.9825441053100245e-05, "optim/total_tokens": 1958001770496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2892913818359375, "created_at": "2025-06-03T06:28:24.550732+00:00"} {"global_step": 233413, "acc_step": 0, "speed/wps": 5508.4321540498795, "speed/FLOPS": 243444506497327.72, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04639577493071556, "optim/lr": 1.98218938280057e-05, "optim/total_tokens": 1958010159104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2863798141479492, "created_at": "2025-06-03T06:28:27.533933+00:00"} {"global_step": 233414, "acc_step": 0, "speed/wps": 5496.345139736062, "speed/FLOPS": 242910322331604.62, "speed/curr_iter_time": 2.978, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.978, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.62 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.62, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04398060217499733, "optim/lr": 1.9818346602911152e-05, "optim/total_tokens": 1958018547712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.293856143951416, "created_at": "2025-06-03T06:28:30.519621+00:00"} {"global_step": 233415, "acc_step": 0, "speed/wps": 5515.4390159341465, "speed/FLOPS": 243754173928242.03, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04487099125981331, "optim/lr": 1.9814799377816826e-05, "optim/total_tokens": 1958026936320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.29106605052948, "created_at": "2025-06-03T06:28:33.493608+00:00"} {"global_step": 233416, "acc_step": 0, "speed/wps": 5520.3178933181725, "speed/FLOPS": 243969795336257.72, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044734887778759, "optim/lr": 1.981125215272228e-05, "optim/total_tokens": 1958035324928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2923921346664429, "created_at": "2025-06-03T06:28:36.465159+00:00"} {"global_step": 233417, "acc_step": 0, "speed/wps": 5520.30996962519, "speed/FLOPS": 243969445149585.03, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045941926538944244, "optim/lr": 1.9807704927627733e-05, "optim/total_tokens": 1958043713536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2853881120681763, "created_at": "2025-06-03T06:28:39.436418+00:00"} {"global_step": 233418, "acc_step": 0, "speed/wps": 5533.097211462393, "speed/FLOPS": 244534575787752.4, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04745229706168175, "optim/lr": 1.9804157702533187e-05, "optim/total_tokens": 1958052102144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2743605375289917, "created_at": "2025-06-03T06:28:42.401011+00:00"} {"global_step": 233419, "acc_step": 0, "speed/wps": 5521.430251350796, "speed/FLOPS": 244018955867735.16, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04595847427845001, "optim/lr": 1.9800610477438864e-05, "optim/total_tokens": 1958060490752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2921675443649292, "created_at": "2025-06-03T06:28:45.371867+00:00"} {"global_step": 233420, "acc_step": 0, "speed/wps": 5513.912452753925, "speed/FLOPS": 243686707649334.9, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.050892602652311325, "optim/lr": 1.9797063252344314e-05, "optim/total_tokens": 1958068879360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2805088758468628, "created_at": "2025-06-03T06:28:48.350377+00:00"} {"global_step": 233421, "acc_step": 0, "speed/wps": 5506.807310918055, "speed/FLOPS": 243372696747602.16, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04404807463288307, "optim/lr": 1.9793516027249768e-05, "optim/total_tokens": 1958077267968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2821639776229858, "created_at": "2025-06-03T06:28:51.332984+00:00"} {"global_step": 233422, "acc_step": 0, "speed/wps": 5499.601810247225, "speed/FLOPS": 243054250499047.28, "speed/curr_iter_time": 2.9769, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9769, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.61 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.61, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04616366699337959, "optim/lr": 1.9789968802155222e-05, "optim/total_tokens": 1958085656576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2994015216827393, "created_at": "2025-06-03T06:28:54.319083+00:00"} {"global_step": 233423, "acc_step": 0, "speed/wps": 5519.546529738778, "speed/FLOPS": 243935705014245.22, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044850606471300125, "optim/lr": 1.97864215770609e-05, "optim/total_tokens": 1958094045184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2838666439056396, "created_at": "2025-06-03T06:28:57.290872+00:00"} {"global_step": 233424, "acc_step": 0, "speed/wps": 5525.357162594116, "speed/FLOPS": 244192505244936.03, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04382740333676338, "optim/lr": 1.9782874351966353e-05, "optim/total_tokens": 1958102433792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2707018852233887, "created_at": "2025-06-03T06:29:00.261786+00:00"} {"global_step": 233425, "acc_step": 0, "speed/wps": 5520.774077760205, "speed/FLOPS": 243989956353631.9, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04315173625946045, "optim/lr": 1.9779327126871806e-05, "optim/total_tokens": 1958110822400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2762725353240967, "created_at": "2025-06-03T06:29:03.235992+00:00"} {"global_step": 233426, "acc_step": 0, "speed/wps": 5514.192711843409, "speed/FLOPS": 243699093666594.03, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04343060404062271, "optim/lr": 1.9775779901777256e-05, "optim/total_tokens": 1958119211008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2896336317062378, "created_at": "2025-06-03T06:29:06.214731+00:00"} {"global_step": 233427, "acc_step": 0, "speed/wps": 5517.151312991126, "speed/FLOPS": 243829848693829.7, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04375848174095154, "optim/lr": 1.9772232676682934e-05, "optim/total_tokens": 1958127599616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2876931428909302, "created_at": "2025-06-03T06:29:09.191077+00:00"} {"global_step": 233428, "acc_step": 0, "speed/wps": 5525.209583336199, "speed/FLOPS": 244185982997115.25, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043640121817588806, "optim/lr": 1.9768685451588387e-05, "optim/total_tokens": 1958135988224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2993396520614624, "created_at": "2025-06-03T06:29:12.160177+00:00"} {"global_step": 233429, "acc_step": 0, "speed/wps": 5511.591635951544, "speed/FLOPS": 243584139425686.94, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04343325272202492, "optim/lr": 1.976513822649384e-05, "optim/total_tokens": 1958144376832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2689011096954346, "created_at": "2025-06-03T06:29:15.138675+00:00"} {"global_step": 233430, "acc_step": 0, "speed/wps": 5524.264167260335, "speed/FLOPS": 244144200445640.2, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04364660382270813, "optim/lr": 1.9761591001399294e-05, "optim/total_tokens": 1958152765440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.3041565418243408, "created_at": "2025-06-03T06:29:18.108688+00:00"} {"global_step": 233431, "acc_step": 0, "speed/wps": 5509.402612017751, "speed/FLOPS": 243487395772253.5, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.6 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.6, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04664444178342819, "optim/lr": 1.9758043776304968e-05, "optim/total_tokens": 1958161154048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2839564085006714, "created_at": "2025-06-03T06:29:21.087715+00:00"} {"global_step": 233432, "acc_step": 0, "speed/wps": 5512.4626056441375, "speed/FLOPS": 243622631828072.53, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.15921609103679657, "optim/lr": 1.9754496551210422e-05, "optim/total_tokens": 1958169542656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.255197286605835, "created_at": "2025-06-03T06:29:24.064333+00:00"} {"global_step": 233433, "acc_step": 0, "speed/wps": 5535.498035904956, "speed/FLOPS": 244640679939580.2, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 191.78, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05126357823610306, "optim/lr": 1.9750949326115875e-05, "optim/total_tokens": 1958177931264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.279534935951233, "created_at": "2025-06-03T06:29:27.030871+00:00"} {"global_step": 233434, "acc_step": 0, "speed/wps": 5512.473548205355, "speed/FLOPS": 243623115433269.25, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.048909448087215424, "optim/lr": 1.974740210102133e-05, "optim/total_tokens": 1958186319872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2938730716705322, "created_at": "2025-06-03T06:29:30.008574+00:00"} {"global_step": 233435, "acc_step": 0, "speed/wps": 5524.223468890424, "speed/FLOPS": 244142401786003.25, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05312490835785866, "optim/lr": 1.9743854875927003e-05, "optim/total_tokens": 1958194708480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.29604172706604, "created_at": "2025-06-03T06:29:32.978798+00:00"} {"global_step": 233436, "acc_step": 0, "speed/wps": 5532.360168429682, "speed/FLOPS": 244502002258234.78, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 191.94, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05418088659644127, "optim/lr": 1.9740307650832456e-05, "optim/total_tokens": 1958203097088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2774972915649414, "created_at": "2025-06-03T06:29:35.943558+00:00"} {"global_step": 233437, "acc_step": 0, "speed/wps": 5522.810831561673, "speed/FLOPS": 244079970446605.78, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05024363473057747, "optim/lr": 1.973676042573791e-05, "optim/total_tokens": 1958211485696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.293349266052246, "created_at": "2025-06-03T06:29:38.914502+00:00"} {"global_step": 233438, "acc_step": 0, "speed/wps": 5514.218561903857, "speed/FLOPS": 243700236106953.25, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.049063071608543396, "optim/lr": 1.9733213200643364e-05, "optim/total_tokens": 1958219874304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2791603803634644, "created_at": "2025-06-03T06:29:41.889992+00:00"} {"global_step": 233439, "acc_step": 0, "speed/wps": 5506.264839714711, "speed/FLOPS": 243348722297033.7, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0534060001373291, "optim/lr": 1.9729665975549038e-05, "optim/total_tokens": 1958228262912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.291914463043213, "created_at": "2025-06-03T06:29:44.868983+00:00"} {"global_step": 233440, "acc_step": 0, "speed/wps": 5535.350925928333, "speed/FLOPS": 244634178431590.6, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 191.8, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04706574231386185, "optim/lr": 1.972611875045449e-05, "optim/total_tokens": 1958236651520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2730374336242676, "created_at": "2025-06-03T06:29:47.835587+00:00"} {"global_step": 233441, "acc_step": 0, "speed/wps": 5532.143116445262, "speed/FLOPS": 244492409671496.22, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 191.86, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.047244396060705185, "optim/lr": 1.9722571525359945e-05, "optim/total_tokens": 1958245040128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2680143117904663, "created_at": "2025-06-03T06:29:50.800814+00:00"} {"global_step": 233442, "acc_step": 0, "speed/wps": 5527.475635736983, "speed/FLOPS": 244286130914522.28, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043791528791189194, "optim/lr": 1.971902430026562e-05, "optim/total_tokens": 1958253428736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2883328199386597, "created_at": "2025-06-03T06:29:53.768846+00:00"} {"global_step": 233443, "acc_step": 0, "speed/wps": 5514.553015888403, "speed/FLOPS": 243715017261179.5, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045859213918447495, "optim/lr": 1.9715477075171072e-05, "optim/total_tokens": 1958261817344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.270887017250061, "created_at": "2025-06-03T06:29:56.745079+00:00"} {"global_step": 233444, "acc_step": 0, "speed/wps": 5505.487978382337, "speed/FLOPS": 243314389002479.53, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.78, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044108062982559204, "optim/lr": 1.9711929850076526e-05, "optim/total_tokens": 1958270205952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.290023922920227, "created_at": "2025-06-03T06:29:59.724810+00:00"} {"global_step": 233445, "acc_step": 0, "speed/wps": 5520.825757374162, "speed/FLOPS": 243992240328048.56, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04422922432422638, "optim/lr": 1.970838262498198e-05, "optim/total_tokens": 1958278594560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.288589358329773, "created_at": "2025-06-03T06:30:02.698401+00:00"} {"global_step": 233446, "acc_step": 0, "speed/wps": 5518.009859556799, "speed/FLOPS": 243867792057592.72, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04436848685145378, "optim/lr": 1.9704835399887657e-05, "optim/total_tokens": 1958286983168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2639588117599487, "created_at": "2025-06-03T06:30:05.671320+00:00"} {"global_step": 233447, "acc_step": 0, "speed/wps": 5502.215761082872, "speed/FLOPS": 243169773746569.6, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.59 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.59, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.052991874516010284, "optim/lr": 1.9701288174793107e-05, "optim/total_tokens": 1958295371776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.272891640663147, "created_at": "2025-06-03T06:30:08.653658+00:00"} {"global_step": 233448, "acc_step": 0, "speed/wps": 5512.362620974659, "speed/FLOPS": 243618213017449.53, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04828387871384621, "optim/lr": 1.969774094969856e-05, "optim/total_tokens": 1958303760384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2864344120025635, "created_at": "2025-06-03T06:30:11.629464+00:00"} {"global_step": 233449, "acc_step": 0, "speed/wps": 5520.957917612252, "speed/FLOPS": 243998081134114.72, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04514652118086815, "optim/lr": 1.9694193724604014e-05, "optim/total_tokens": 1958312148992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2739640474319458, "created_at": "2025-06-03T06:30:14.604754+00:00"} {"global_step": 233450, "acc_step": 0, "speed/wps": 5521.587305182451, "speed/FLOPS": 244025896843219.9, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05024569481611252, "optim/lr": 1.969064649950969e-05, "optim/total_tokens": 1958320537600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.287530779838562, "created_at": "2025-06-03T06:30:17.579354+00:00"} {"global_step": 233451, "acc_step": 0, "speed/wps": 5525.064236514324, "speed/FLOPS": 244179559411540.84, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04639575257897377, "optim/lr": 1.9687099274415145e-05, "optim/total_tokens": 1958328926208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.273230791091919, "created_at": "2025-06-03T06:30:20.550178+00:00"} {"global_step": 233452, "acc_step": 0, "speed/wps": 5526.085130832728, "speed/FLOPS": 244224677715003.5, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.12, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04494241625070572, "optim/lr": 1.9683552049320595e-05, "optim/total_tokens": 1958337314816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2885180711746216, "created_at": "2025-06-03T06:30:23.518471+00:00"} {"global_step": 233453, "acc_step": 0, "speed/wps": 5507.820663184407, "speed/FLOPS": 243417481730967.8, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.81, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04651850834488869, "optim/lr": 1.968000482422605e-05, "optim/total_tokens": 1958345703424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.291381597518921, "created_at": "2025-06-03T06:30:26.496300+00:00"} {"global_step": 233454, "acc_step": 0, "speed/wps": 5517.2645102915285, "speed/FLOPS": 243834851435111.16, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044354524463415146, "optim/lr": 1.9676457599131726e-05, "optim/total_tokens": 1958354092032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2911759614944458, "created_at": "2025-06-03T06:30:29.469443+00:00"} {"global_step": 233455, "acc_step": 0, "speed/wps": 5521.073263792871, "speed/FLOPS": 244003178844902.8, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04663288593292236, "optim/lr": 1.967291037403718e-05, "optim/total_tokens": 1958362480640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2840220928192139, "created_at": "2025-06-03T06:30:32.442305+00:00"} {"global_step": 233456, "acc_step": 0, "speed/wps": 5506.241310216521, "speed/FLOPS": 243347682413648.56, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04608731344342232, "optim/lr": 1.9669363148942633e-05, "optim/total_tokens": 1958370869248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2930055856704712, "created_at": "2025-06-03T06:30:35.421910+00:00"} {"global_step": 233457, "acc_step": 0, "speed/wps": 5499.895109193471, "speed/FLOPS": 243067212811231.25, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.58 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.58, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0461244061589241, "optim/lr": 1.9665815923848083e-05, "optim/total_tokens": 1958379257856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2715115547180176, "created_at": "2025-06-03T06:30:38.405232+00:00"} {"global_step": 233458, "acc_step": 0, "speed/wps": 5529.324524701664, "speed/FLOPS": 244367842343289.53, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04434135928750038, "optim/lr": 1.966226869875376e-05, "optim/total_tokens": 1958387646464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2672172784805298, "created_at": "2025-06-03T06:30:41.374310+00:00"} {"global_step": 233459, "acc_step": 0, "speed/wps": 5522.855059575671, "speed/FLOPS": 244081925098444.97, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04862052574753761, "optim/lr": 1.9658721473659214e-05, "optim/total_tokens": 1958396035072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2871335744857788, "created_at": "2025-06-03T06:30:44.344523+00:00"} {"global_step": 233460, "acc_step": 0, "speed/wps": 5528.229036029846, "speed/FLOPS": 244319427351214.5, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.12, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045391861349344254, "optim/lr": 1.9655174248564668e-05, "optim/total_tokens": 1958404423680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2759463787078857, "created_at": "2025-06-03T06:30:47.316046+00:00"} {"global_step": 233461, "acc_step": 0, "speed/wps": 5516.521952387558, "speed/FLOPS": 243802034176511.53, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04326486214995384, "optim/lr": 1.965162702347012e-05, "optim/total_tokens": 1958412812288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2897895574569702, "created_at": "2025-06-03T06:30:50.290613+00:00"} {"global_step": 233462, "acc_step": 0, "speed/wps": 5522.6215931102815, "speed/FLOPS": 244071607075664.5, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043736059218645096, "optim/lr": 1.9648079798375795e-05, "optim/total_tokens": 1958421200896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2948662042617798, "created_at": "2025-06-03T06:30:53.260751+00:00"} {"global_step": 233463, "acc_step": 0, "speed/wps": 5511.968602896815, "speed/FLOPS": 243600799435176.2, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04619116708636284, "optim/lr": 1.964453257328125e-05, "optim/total_tokens": 1958429589504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2868342399597168, "created_at": "2025-06-03T06:30:56.237407+00:00"} {"global_step": 233464, "acc_step": 0, "speed/wps": 5506.398247425999, "speed/FLOPS": 243354618235030.06, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04353053867816925, "optim/lr": 1.9640985348186702e-05, "optim/total_tokens": 1958437978112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2849496603012085, "created_at": "2025-06-03T06:30:59.216607+00:00"} {"global_step": 233465, "acc_step": 0, "speed/wps": 5504.493596112747, "speed/FLOPS": 243270442395873.47, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05065149813890457, "optim/lr": 1.9637438123092156e-05, "optim/total_tokens": 1958446366720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2925846576690674, "created_at": "2025-06-03T06:31:02.197286+00:00"} {"global_step": 233466, "acc_step": 0, "speed/wps": 5517.651381525171, "speed/FLOPS": 243851949163451.7, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04453879967331886, "optim/lr": 1.963389089799783e-05, "optim/total_tokens": 1958454755328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.288092851638794, "created_at": "2025-06-03T06:31:05.173963+00:00"} {"global_step": 233467, "acc_step": 0, "speed/wps": 5515.480413261698, "speed/FLOPS": 243756003478229.06, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.047412119805812836, "optim/lr": 1.9630343672903283e-05, "optim/total_tokens": 1958463143936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2857128381729126, "created_at": "2025-06-03T06:31:08.148229+00:00"} {"global_step": 233468, "acc_step": 0, "speed/wps": 5518.034403609086, "speed/FLOPS": 243868876779076.0, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045093730092048645, "optim/lr": 1.9626796447808737e-05, "optim/total_tokens": 1958471532544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2891734838485718, "created_at": "2025-06-03T06:31:11.120775+00:00"} {"global_step": 233469, "acc_step": 0, "speed/wps": 5518.269954188747, "speed/FLOPS": 243879286909039.8, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04451422020792961, "optim/lr": 1.962324922271441e-05, "optim/total_tokens": 1958479921152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2709704637527466, "created_at": "2025-06-03T06:31:14.094413+00:00"} {"global_step": 233470, "acc_step": 0, "speed/wps": 5525.388940649859, "speed/FLOPS": 244193909672345.06, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045117709785699844, "optim/lr": 1.9619701997619865e-05, "optim/total_tokens": 1958488309760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2952739000320435, "created_at": "2025-06-03T06:31:17.063087+00:00"} {"global_step": 233471, "acc_step": 0, "speed/wps": 5525.101932717652, "speed/FLOPS": 244181225390781.25, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04661129415035248, "optim/lr": 1.9616154772525318e-05, "optim/total_tokens": 1958496698368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2903581857681274, "created_at": "2025-06-03T06:31:20.035436+00:00"} {"global_step": 233472, "acc_step": 0, "speed/wps": 5517.294924390064, "speed/FLOPS": 243836195582592.94, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045971281826496124, "optim/lr": 1.9612607547430772e-05, "optim/total_tokens": 1958505086976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2656512260437012, "created_at": "2025-06-03T06:31:23.011552+00:00"} {"global_step": 233473, "acc_step": 0, "speed/wps": 5501.049692509783, "speed/FLOPS": 243118239484119.1, "speed/curr_iter_time": 2.9772, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9772, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.57 hours", "speed/est_time_elapsed_hrs": 193.08, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.57, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.047033313661813736, "optim/lr": 1.9609060322336446e-05, "optim/total_tokens": 1958513475584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2806605100631714, "created_at": "2025-06-03T06:31:25.993553+00:00"} {"global_step": 233474, "acc_step": 0, "speed/wps": 5522.789404402115, "speed/FLOPS": 244079023475827.47, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04527255892753601, "optim/lr": 1.96055130972419e-05, "optim/total_tokens": 1958521864192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2965004444122314, "created_at": "2025-06-03T06:31:28.967504+00:00"} {"global_step": 233475, "acc_step": 0, "speed/wps": 5522.001509796929, "speed/FLOPS": 244044202567088.4, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04555024951696396, "optim/lr": 1.9601965872147353e-05, "optim/total_tokens": 1958530252800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2758710384368896, "created_at": "2025-06-03T06:31:31.940727+00:00"} {"global_step": 233476, "acc_step": 0, "speed/wps": 5514.792095541329, "speed/FLOPS": 243725583358118.25, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04346057400107384, "optim/lr": 1.9598418647052806e-05, "optim/total_tokens": 1958538641408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2749993801116943, "created_at": "2025-06-03T06:31:34.918487+00:00"} {"global_step": 233477, "acc_step": 0, "speed/wps": 5521.508384627907, "speed/FLOPS": 244022408958661.06, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04901769384741783, "optim/lr": 1.9594871421958484e-05, "optim/total_tokens": 1958547030016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.290283203125, "created_at": "2025-06-03T06:31:37.890152+00:00"} {"global_step": 233478, "acc_step": 0, "speed/wps": 5509.321536773461, "speed/FLOPS": 243483812661436.6, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04351356253027916, "optim/lr": 1.9591324196863934e-05, "optim/total_tokens": 1958555418624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2945401668548584, "created_at": "2025-06-03T06:31:40.870845+00:00"} {"global_step": 233479, "acc_step": 0, "speed/wps": 5510.481827568037, "speed/FLOPS": 243535091575650.2, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04750022664666176, "optim/lr": 1.9587776971769387e-05, "optim/total_tokens": 1958563807232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2859772443771362, "created_at": "2025-06-03T06:31:43.847953+00:00"} {"global_step": 233480, "acc_step": 0, "speed/wps": 5504.670810474749, "speed/FLOPS": 243278274363608.62, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045514367520809174, "optim/lr": 1.958422974667484e-05, "optim/total_tokens": 1958572195840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.295698642730713, "created_at": "2025-06-03T06:31:46.831941+00:00"} {"global_step": 233481, "acc_step": 0, "speed/wps": 5509.136137234004, "speed/FLOPS": 243475618950753.47, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.56 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.56, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04382219538092613, "optim/lr": 1.9580682521580518e-05, "optim/total_tokens": 1958580584448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2912843227386475, "created_at": "2025-06-03T06:31:49.809498+00:00"} {"global_step": 233482, "acc_step": 0, "speed/wps": 5512.420298846519, "speed/FLOPS": 243620762084163.6, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04453109949827194, "optim/lr": 1.9577135296485972e-05, "optim/total_tokens": 1958588973056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2897636890411377, "created_at": "2025-06-03T06:31:52.789008+00:00"} {"global_step": 233483, "acc_step": 0, "speed/wps": 5528.167559902257, "speed/FLOPS": 244316710421038.44, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043494511395692825, "optim/lr": 1.9573588071391425e-05, "optim/total_tokens": 1958597361664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2885990142822266, "created_at": "2025-06-03T06:31:55.757325+00:00"} {"global_step": 233484, "acc_step": 0, "speed/wps": 5521.488622998341, "speed/FLOPS": 244021535595783.47, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0440606065094471, "optim/lr": 1.9570040846296876e-05, "optim/total_tokens": 1958605750272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2780481576919556, "created_at": "2025-06-03T06:31:58.728220+00:00"} {"global_step": 233485, "acc_step": 0, "speed/wps": 5518.930821521893, "speed/FLOPS": 243908493862539.25, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.042860038578510284, "optim/lr": 1.9566493621202553e-05, "optim/total_tokens": 1958614138880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2870205640792847, "created_at": "2025-06-03T06:32:01.701360+00:00"} {"global_step": 233486, "acc_step": 0, "speed/wps": 5518.257023976324, "speed/FLOPS": 243878715459833.53, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04353328049182892, "optim/lr": 1.9562946396108007e-05, "optim/total_tokens": 1958622527488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.3107625246047974, "created_at": "2025-06-03T06:32:04.676453+00:00"} {"global_step": 233487, "acc_step": 0, "speed/wps": 5511.170853598051, "speed/FLOPS": 243565542999421.84, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04421522095799446, "optim/lr": 1.955939917101346e-05, "optim/total_tokens": 1958630916096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.281339406967163, "created_at": "2025-06-03T06:32:07.654452+00:00"} {"global_step": 233488, "acc_step": 0, "speed/wps": 5503.381506765346, "speed/FLOPS": 243221293738907.66, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04365022853016853, "optim/lr": 1.9555851945918914e-05, "optim/total_tokens": 1958639304704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2922673225402832, "created_at": "2025-06-03T06:32:10.635046+00:00"} {"global_step": 233489, "acc_step": 0, "speed/wps": 5504.384836925939, "speed/FLOPS": 243265635796496.56, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.042741671204566956, "optim/lr": 1.9552304720824588e-05, "optim/total_tokens": 1958647693312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2844858169555664, "created_at": "2025-06-03T06:32:13.619534+00:00"} {"global_step": 233490, "acc_step": 0, "speed/wps": 5511.55587047971, "speed/FLOPS": 243582558774896.16, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04502738639712334, "optim/lr": 1.954875749573004e-05, "optim/total_tokens": 1958656081920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2959380149841309, "created_at": "2025-06-03T06:32:16.600742+00:00"} {"global_step": 233491, "acc_step": 0, "speed/wps": 5518.670357733353, "speed/FLOPS": 243896982696260.28, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04846766218543053, "optim/lr": 1.9545210270635495e-05, "optim/total_tokens": 1958664470528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2840633392333984, "created_at": "2025-06-03T06:32:19.575130+00:00"} {"global_step": 233492, "acc_step": 0, "speed/wps": 5516.080492914242, "speed/FLOPS": 243782523927385.44, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0435572974383831, "optim/lr": 1.954166304554095e-05, "optim/total_tokens": 1958672859136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2842665910720825, "created_at": "2025-06-03T06:32:22.553564+00:00"} {"global_step": 233493, "acc_step": 0, "speed/wps": 5512.312301828102, "speed/FLOPS": 243615989168728.44, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.050859373062849045, "optim/lr": 1.9538115820446622e-05, "optim/total_tokens": 1958681247744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2920576333999634, "created_at": "2025-06-03T06:32:25.529147+00:00"} {"global_step": 233494, "acc_step": 0, "speed/wps": 5516.429892085703, "speed/FLOPS": 243797965582376.9, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04390818998217583, "optim/lr": 1.9534568595352076e-05, "optim/total_tokens": 1958689636352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.267822504043579, "created_at": "2025-06-03T06:32:28.502275+00:00"} {"global_step": 233495, "acc_step": 0, "speed/wps": 5517.551159654718, "speed/FLOPS": 243847519869759.66, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.047471798956394196, "optim/lr": 1.953102137025753e-05, "optim/total_tokens": 1958698024960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2855708599090576, "created_at": "2025-06-03T06:32:31.475213+00:00"} {"global_step": 233496, "acc_step": 0, "speed/wps": 5514.146410576634, "speed/FLOPS": 243697047387593.94, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044121671468019485, "optim/lr": 1.9527474145162983e-05, "optim/total_tokens": 1958706413568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.276817798614502, "created_at": "2025-06-03T06:32:34.452861+00:00"} {"global_step": 233497, "acc_step": 0, "speed/wps": 5501.31807015802, "speed/FLOPS": 243130100402489.84, "speed/curr_iter_time": 2.977, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.977, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04374395310878754, "optim/lr": 1.9523926920068657e-05, "optim/total_tokens": 1958714802176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2839961051940918, "created_at": "2025-06-03T06:32:37.440159+00:00"} {"global_step": 233498, "acc_step": 0, "speed/wps": 5501.389877129837, "speed/FLOPS": 243133273903102.75, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04348758980631828, "optim/lr": 1.952037969497411e-05, "optim/total_tokens": 1958723190784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.272700309753418, "created_at": "2025-06-03T06:32:40.426969+00:00"} {"global_step": 233499, "acc_step": 0, "speed/wps": 5503.449953538135, "speed/FLOPS": 243224318735922.56, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.55 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.55, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044842030853033066, "optim/lr": 1.9516832469879564e-05, "optim/total_tokens": 1958731579392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.284326434135437, "created_at": "2025-06-03T06:32:43.410845+00:00"} {"global_step": 233500, "acc_step": 0, "speed/wps": 5532.693409828012, "speed/FLOPS": 244516729822356.88, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.0, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046047408133745193, "optim/lr": 1.9513285244785238e-05, "optim/total_tokens": 1958739968000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2959426641464233, "created_at": "2025-06-03T06:32:46.380890+00:00"} {"global_step": 233501, "acc_step": 0, "speed/wps": 5510.488169601694, "speed/FLOPS": 243535371861076.34, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04650089517235756, "optim/lr": 1.950973801969069e-05, "optim/total_tokens": 1958748356608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2855935096740723, "created_at": "2025-06-03T06:32:49.357186+00:00"} {"global_step": 233502, "acc_step": 0, "speed/wps": 5518.392303048393, "speed/FLOPS": 243884694102397.94, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04614171013236046, "optim/lr": 1.9506190794596145e-05, "optim/total_tokens": 1958756745216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.296857237815857, "created_at": "2025-06-03T06:32:52.335452+00:00"} {"global_step": 233503, "acc_step": 0, "speed/wps": 5504.983930835597, "speed/FLOPS": 243292112680862.8, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04477018490433693, "optim/lr": 1.95026435695016e-05, "optim/total_tokens": 1958765133824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.274328589439392, "created_at": "2025-06-03T06:32:55.319349+00:00"} {"global_step": 233504, "acc_step": 0, "speed/wps": 5502.741745678924, "speed/FLOPS": 243193019573481.9, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.048765089362859726, "optim/lr": 1.9499096344407276e-05, "optim/total_tokens": 1958773522432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2842938899993896, "created_at": "2025-06-03T06:32:58.305929+00:00"} {"global_step": 233505, "acc_step": 0, "speed/wps": 5514.044598055114, "speed/FLOPS": 243692547795266.5, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04478307068347931, "optim/lr": 1.9495549119312726e-05, "optim/total_tokens": 1958781911040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2860512733459473, "created_at": "2025-06-03T06:33:01.280600+00:00"} {"global_step": 233506, "acc_step": 0, "speed/wps": 5511.636668729507, "speed/FLOPS": 243586129643974.22, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05039975792169571, "optim/lr": 1.949200189421818e-05, "optim/total_tokens": 1958790299648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2709503173828125, "created_at": "2025-06-03T06:33:04.260748+00:00"} {"global_step": 233507, "acc_step": 0, "speed/wps": 5518.805432004047, "speed/FLOPS": 243902952287652.2, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04381726309657097, "optim/lr": 1.9488454669123633e-05, "optim/total_tokens": 1958798688256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2854660749435425, "created_at": "2025-06-03T06:33:07.233571+00:00"} {"global_step": 233508, "acc_step": 0, "speed/wps": 5524.976977954518, "speed/FLOPS": 244175703029827.2, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.048643581569194794, "optim/lr": 1.948490744402931e-05, "optim/total_tokens": 1958807076864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3059849739074707, "created_at": "2025-06-03T06:33:10.207325+00:00"} {"global_step": 233509, "acc_step": 0, "speed/wps": 5513.859730341654, "speed/FLOPS": 243684377588570.28, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045597054064273834, "optim/lr": 1.9481360218934764e-05, "optim/total_tokens": 1958815465472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2897989749908447, "created_at": "2025-06-03T06:33:13.182974+00:00"} {"global_step": 233510, "acc_step": 0, "speed/wps": 5519.170709911613, "speed/FLOPS": 243919095701504.75, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04919593036174774, "optim/lr": 1.9477812993840214e-05, "optim/total_tokens": 1958823854080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2882550954818726, "created_at": "2025-06-03T06:33:16.156960+00:00"} {"global_step": 233511, "acc_step": 0, "speed/wps": 5518.563030156042, "speed/FLOPS": 243892239366695.47, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04370627552270889, "optim/lr": 1.9474265768745668e-05, "optim/total_tokens": 1958832242688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2950297594070435, "created_at": "2025-06-03T06:33:19.128848+00:00"} {"global_step": 233512, "acc_step": 0, "speed/wps": 5518.592232479375, "speed/FLOPS": 243893529959915.72, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.43, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046938639134168625, "optim/lr": 1.9470718543651345e-05, "optim/total_tokens": 1958840631296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.306631088256836, "created_at": "2025-06-03T06:33:22.101626+00:00"} {"global_step": 233513, "acc_step": 0, "speed/wps": 5508.438249032931, "speed/FLOPS": 243444775864381.66, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04425344616174698, "optim/lr": 1.94671713185568e-05, "optim/total_tokens": 1958849019904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2885373830795288, "created_at": "2025-06-03T06:33:25.084738+00:00"} {"global_step": 233514, "acc_step": 0, "speed/wps": 5506.799224713067, "speed/FLOPS": 243372339378730.62, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04840109124779701, "optim/lr": 1.9463624093462252e-05, "optim/total_tokens": 1958857408512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.3001066446304321, "created_at": "2025-06-03T06:33:28.064494+00:00"} {"global_step": 233515, "acc_step": 0, "speed/wps": 5499.788030944843, "speed/FLOPS": 243062480500718.03, "speed/curr_iter_time": 2.9768, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9768, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.54 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.54, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043645840138196945, "optim/lr": 1.9460076868367703e-05, "optim/total_tokens": 1958865797120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2760735750198364, "created_at": "2025-06-03T06:33:31.049065+00:00"} {"global_step": 233516, "acc_step": 0, "speed/wps": 5507.803445896708, "speed/FLOPS": 243416720814977.6, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.53 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.53, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04843906685709953, "optim/lr": 1.945652964327338e-05, "optim/total_tokens": 1958874185728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2804796695709229, "created_at": "2025-06-03T06:33:34.030738+00:00"} {"global_step": 233517, "acc_step": 0, "speed/wps": 5533.638196152182, "speed/FLOPS": 244558484542030.4, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 191.98, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.042981866747140884, "optim/lr": 1.9452982418178834e-05, "optim/total_tokens": 1958882574336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2839462757110596, "created_at": "2025-06-03T06:33:36.994899+00:00"} {"global_step": 233518, "acc_step": 0, "speed/wps": 5517.761086584263, "speed/FLOPS": 243856797565542.12, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044220153242349625, "optim/lr": 1.9449435193084287e-05, "optim/total_tokens": 1958890962944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2968319654464722, "created_at": "2025-06-03T06:33:39.969690+00:00"} {"global_step": 233519, "acc_step": 0, "speed/wps": 5518.110876111762, "speed/FLOPS": 243872256472272.5, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04402077570557594, "optim/lr": 1.944588796798974e-05, "optim/total_tokens": 1958899351552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2914226055145264, "created_at": "2025-06-03T06:33:42.946770+00:00"} {"global_step": 233520, "acc_step": 0, "speed/wps": 5521.110561174921, "speed/FLOPS": 244004827198284.1, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0427868515253067, "optim/lr": 1.9442340742895415e-05, "optim/total_tokens": 1958907740160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2780380249023438, "created_at": "2025-06-03T06:33:45.919247+00:00"} {"global_step": 233521, "acc_step": 0, "speed/wps": 5511.020797603862, "speed/FLOPS": 243558911292534.9, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0463922880589962, "optim/lr": 1.9438793517800868e-05, "optim/total_tokens": 1958916128768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.271946668624878, "created_at": "2025-06-03T06:33:48.899953+00:00"} {"global_step": 233522, "acc_step": 0, "speed/wps": 5515.175489724323, "speed/FLOPS": 243742527418617.22, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0439554825425148, "optim/lr": 1.9435246292706322e-05, "optim/total_tokens": 1958924517376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.27507483959198, "created_at": "2025-06-03T06:33:51.874566+00:00"} {"global_step": 233523, "acc_step": 0, "speed/wps": 5512.374429359471, "speed/FLOPS": 243618734887617.4, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05190832540392876, "optim/lr": 1.9431699067611775e-05, "optim/total_tokens": 1958932905984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.3003312349319458, "created_at": "2025-06-03T06:33:54.850615+00:00"} {"global_step": 233524, "acc_step": 0, "speed/wps": 5512.711712541599, "speed/FLOPS": 243633641077895.66, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043402865529060364, "optim/lr": 1.942815184251745e-05, "optim/total_tokens": 1958941294592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2975252866744995, "created_at": "2025-06-03T06:33:57.826204+00:00"} {"global_step": 233525, "acc_step": 0, "speed/wps": 5518.155517422792, "speed/FLOPS": 243874229389725.1, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.049204327166080475, "optim/lr": 1.9424604617422903e-05, "optim/total_tokens": 1958949683200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.27677321434021, "created_at": "2025-06-03T06:34:00.803540+00:00"} {"global_step": 233526, "acc_step": 0, "speed/wps": 5513.71735531398, "speed/FLOPS": 243678085341088.56, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04304078593850136, "optim/lr": 1.9421057392328356e-05, "optim/total_tokens": 1958958071808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2701797485351562, "created_at": "2025-06-03T06:34:03.779982+00:00"} {"global_step": 233527, "acc_step": 0, "speed/wps": 5514.8404402943015, "speed/FLOPS": 243727719948748.75, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04420638456940651, "optim/lr": 1.941751016723403e-05, "optim/total_tokens": 1958966460416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2988204956054688, "created_at": "2025-06-03T06:34:06.757657+00:00"} {"global_step": 233528, "acc_step": 0, "speed/wps": 5506.131500077349, "speed/FLOPS": 243342829367556.44, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.051300160586833954, "optim/lr": 1.9413962942139484e-05, "optim/total_tokens": 1958974849024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.294737458229065, "created_at": "2025-06-03T06:34:09.736653+00:00"} {"global_step": 233529, "acc_step": 0, "speed/wps": 5512.921842776118, "speed/FLOPS": 243642927758717.34, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045391745865345, "optim/lr": 1.9410415717044937e-05, "optim/total_tokens": 1958983237632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.273790717124939, "created_at": "2025-06-03T06:34:12.711835+00:00"} {"global_step": 233530, "acc_step": 0, "speed/wps": 5510.72352732613, "speed/FLOPS": 243545773467826.38, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05078958347439766, "optim/lr": 1.940686849195039e-05, "optim/total_tokens": 1958991626240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3050017356872559, "created_at": "2025-06-03T06:34:15.689334+00:00"} {"global_step": 233531, "acc_step": 0, "speed/wps": 5505.640083452694, "speed/FLOPS": 243321111268044.97, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.52 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.52, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046175383031368256, "optim/lr": 1.9403321266856065e-05, "optim/total_tokens": 1959000014848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2765625715255737, "created_at": "2025-06-03T06:34:18.674078+00:00"} {"global_step": 233532, "acc_step": 0, "speed/wps": 5528.804584442501, "speed/FLOPS": 244344863645130.06, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04725589230656624, "optim/lr": 1.939977404176152e-05, "optim/total_tokens": 1959008403456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2945224046707153, "created_at": "2025-06-03T06:34:21.644895+00:00"} {"global_step": 233533, "acc_step": 0, "speed/wps": 5524.906574907657, "speed/FLOPS": 244172591575511.4, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04284907132387161, "optim/lr": 1.9396226816666972e-05, "optim/total_tokens": 1959016792064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2966303825378418, "created_at": "2025-06-03T06:34:24.613726+00:00"} {"global_step": 233534, "acc_step": 0, "speed/wps": 5509.992603327687, "speed/FLOPS": 243513470368303.38, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 192.81, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04708954691886902, "optim/lr": 1.9392679591572426e-05, "optim/total_tokens": 1959025180672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2774673700332642, "created_at": "2025-06-03T06:34:27.597125+00:00"} {"global_step": 233535, "acc_step": 0, "speed/wps": 5506.420410212955, "speed/FLOPS": 243355597716774.1, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04366792365908623, "optim/lr": 1.9389132366478103e-05, "optim/total_tokens": 1959033569280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2855898141860962, "created_at": "2025-06-03T06:34:30.579170+00:00"} {"global_step": 233536, "acc_step": 0, "speed/wps": 5515.548997474328, "speed/FLOPS": 243759034549381.47, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0433950237929821, "optim/lr": 1.9385585141383557e-05, "optim/total_tokens": 1959041957888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2923692464828491, "created_at": "2025-06-03T06:34:33.552974+00:00"} {"global_step": 233537, "acc_step": 0, "speed/wps": 5520.891602367954, "speed/FLOPS": 243995150339748.94, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04813140258193016, "optim/lr": 1.9382037916289007e-05, "optim/total_tokens": 1959050346496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2961900234222412, "created_at": "2025-06-03T06:34:36.524142+00:00"} {"global_step": 233538, "acc_step": 0, "speed/wps": 5514.812467933667, "speed/FLOPS": 243726483713584.22, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04310499504208565, "optim/lr": 1.937849069119446e-05, "optim/total_tokens": 1959058735104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2763195037841797, "created_at": "2025-06-03T06:34:39.498313+00:00"} {"global_step": 233539, "acc_step": 0, "speed/wps": 5517.273660700399, "speed/FLOPS": 243835255836347.2, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0491194911301136, "optim/lr": 1.9374943466100138e-05, "optim/total_tokens": 1959067123712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.281144618988037, "created_at": "2025-06-03T06:34:42.475590+00:00"} {"global_step": 233540, "acc_step": 0, "speed/wps": 5515.53033547575, "speed/FLOPS": 243758209784565.1, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0437309592962265, "optim/lr": 1.937139624100559e-05, "optim/total_tokens": 1959075512320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2847641706466675, "created_at": "2025-06-03T06:34:45.451180+00:00"} {"global_step": 233541, "acc_step": 0, "speed/wps": 5523.654349980811, "speed/FLOPS": 244117249643213.03, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05001667141914368, "optim/lr": 1.9367849015911045e-05, "optim/total_tokens": 1959083900928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2737407684326172, "created_at": "2025-06-03T06:34:48.421010+00:00"} {"global_step": 233542, "acc_step": 0, "speed/wps": 5527.132909054117, "speed/FLOPS": 244270984149373.75, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.17, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044301293790340424, "optim/lr": 1.9364301790816495e-05, "optim/total_tokens": 1959092289536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.294899582862854, "created_at": "2025-06-03T06:34:51.388796+00:00"} {"global_step": 233543, "acc_step": 0, "speed/wps": 5524.328402907015, "speed/FLOPS": 244147039332435.6, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04376911371946335, "optim/lr": 1.9360754565722172e-05, "optim/total_tokens": 1959100678144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2832683324813843, "created_at": "2025-06-03T06:34:54.358149+00:00"} {"global_step": 233544, "acc_step": 0, "speed/wps": 5520.774157889604, "speed/FLOPS": 243989959894941.22, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043987926095724106, "optim/lr": 1.9357207340627626e-05, "optim/total_tokens": 1959109066752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2772634029388428, "created_at": "2025-06-03T06:34:57.329305+00:00"} {"global_step": 233545, "acc_step": 0, "speed/wps": 5522.574155932837, "speed/FLOPS": 244069510595226.94, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043692246079444885, "optim/lr": 1.935366011553308e-05, "optim/total_tokens": 1959117455360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2886595726013184, "created_at": "2025-06-03T06:35:00.304505+00:00"} {"global_step": 233546, "acc_step": 0, "speed/wps": 5507.292502542258, "speed/FLOPS": 243394139733956.1, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04313052445650101, "optim/lr": 1.9350112890438533e-05, "optim/total_tokens": 1959125843968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2828952074050903, "created_at": "2025-06-03T06:35:03.284232+00:00"} {"global_step": 233547, "acc_step": 0, "speed/wps": 5510.930373112169, "speed/FLOPS": 243554914992836.6, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04421914368867874, "optim/lr": 1.9346565665344207e-05, "optim/total_tokens": 1959134232576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2917613983154297, "created_at": "2025-06-03T06:35:06.261405+00:00"} {"global_step": 233548, "acc_step": 0, "speed/wps": 5494.552931358507, "speed/FLOPS": 242831115894670.75, "speed/curr_iter_time": 2.9807, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9807, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043302569538354874, "optim/lr": 1.934301844024966e-05, "optim/total_tokens": 1959142621184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2782049179077148, "created_at": "2025-06-03T06:35:09.247065+00:00"} {"global_step": 233549, "acc_step": 0, "speed/wps": 5502.092134894803, "speed/FLOPS": 243164310101833.16, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.51 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.51, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04366172477602959, "optim/lr": 1.9339471215155114e-05, "optim/total_tokens": 1959151009792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2875251770019531, "created_at": "2025-06-03T06:35:12.231900+00:00"} {"global_step": 233550, "acc_step": 0, "speed/wps": 5528.932390120569, "speed/FLOPS": 244350512001931.88, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04459042474627495, "optim/lr": 1.9335923990060568e-05, "optim/total_tokens": 1959159398400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2837289571762085, "created_at": "2025-06-03T06:35:15.198836+00:00"} {"global_step": 233551, "acc_step": 0, "speed/wps": 5522.042925096343, "speed/FLOPS": 244046032911339.8, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04323282465338707, "optim/lr": 1.933237676496624e-05, "optim/total_tokens": 1959167787008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2890701293945312, "created_at": "2025-06-03T06:35:18.169151+00:00"} {"global_step": 233552, "acc_step": 0, "speed/wps": 5525.565577873098, "speed/FLOPS": 244201716133500.94, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043659843504428864, "optim/lr": 1.9328829539871695e-05, "optim/total_tokens": 1959176175616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2911168336868286, "created_at": "2025-06-03T06:35:21.138578+00:00"} {"global_step": 233553, "acc_step": 0, "speed/wps": 5521.314817906298, "speed/FLOPS": 244013854300330.25, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04379010200500488, "optim/lr": 1.932528231477715e-05, "optim/total_tokens": 1959184564224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.287817120552063, "created_at": "2025-06-03T06:35:24.112737+00:00"} {"global_step": 233554, "acc_step": 0, "speed/wps": 5510.802378966269, "speed/FLOPS": 243549258306721.25, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.81, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043874166905879974, "optim/lr": 1.9321735089682823e-05, "optim/total_tokens": 1959192952832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2747224569320679, "created_at": "2025-06-03T06:35:27.090250+00:00"} {"global_step": 233555, "acc_step": 0, "speed/wps": 5505.481364428858, "speed/FLOPS": 243314096699589.03, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04540614038705826, "optim/lr": 1.9318187864588276e-05, "optim/total_tokens": 1959201341440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.274446725845337, "created_at": "2025-06-03T06:35:30.071154+00:00"} {"global_step": 233556, "acc_step": 0, "speed/wps": 5506.1863156297595, "speed/FLOPS": 243345251934401.53, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04353678226470947, "optim/lr": 1.931464063949373e-05, "optim/total_tokens": 1959209730048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2765856981277466, "created_at": "2025-06-03T06:35:33.053190+00:00"} {"global_step": 233557, "acc_step": 0, "speed/wps": 5505.257705426962, "speed/FLOPS": 243304212116495.78, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.5 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.5, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.056599508970975876, "optim/lr": 1.9311093414399183e-05, "optim/total_tokens": 1959218118656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.278918981552124, "created_at": "2025-06-03T06:35:36.033929+00:00"} {"global_step": 233558, "acc_step": 0, "speed/wps": 5517.1002488960285, "speed/FLOPS": 243827591922196.1, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04630649834871292, "optim/lr": 1.9307546189304857e-05, "optim/total_tokens": 1959226507264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.3120232820510864, "created_at": "2025-06-03T06:35:39.007689+00:00"} {"global_step": 233559, "acc_step": 0, "speed/wps": 5518.302742155669, "speed/FLOPS": 243880735969353.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04484034329652786, "optim/lr": 1.930399896421031e-05, "optim/total_tokens": 1959234895872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2846897840499878, "created_at": "2025-06-03T06:35:41.980407+00:00"} {"global_step": 233560, "acc_step": 0, "speed/wps": 5511.91448210555, "speed/FLOPS": 243598407573217.56, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04545827955007553, "optim/lr": 1.9300451739115764e-05, "optim/total_tokens": 1959243284480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2797610759735107, "created_at": "2025-06-03T06:35:44.956806+00:00"} {"global_step": 233561, "acc_step": 0, "speed/wps": 5514.037731934392, "speed/FLOPS": 243692244347874.56, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05085863918066025, "optim/lr": 1.9296904514021218e-05, "optim/total_tokens": 1959251673088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2877134084701538, "created_at": "2025-06-03T06:35:47.933349+00:00"} {"global_step": 233562, "acc_step": 0, "speed/wps": 5519.301716461755, "speed/FLOPS": 243924885520468.72, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04229608178138733, "optim/lr": 1.9293357288926895e-05, "optim/total_tokens": 1959260061696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2731752395629883, "created_at": "2025-06-03T06:35:50.905255+00:00"} {"global_step": 233563, "acc_step": 0, "speed/wps": 5518.20472733773, "speed/FLOPS": 243876404216086.16, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.050670523196458817, "optim/lr": 1.9289810063832346e-05, "optim/total_tokens": 1959268450304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2760064601898193, "created_at": "2025-06-03T06:35:53.877438+00:00"} {"global_step": 233564, "acc_step": 0, "speed/wps": 5503.450949955566, "speed/FLOPS": 243224362772472.9, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04433760046958923, "optim/lr": 1.92862628387378e-05, "optim/total_tokens": 1959276838912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.291586995124817, "created_at": "2025-06-03T06:35:56.862109+00:00"} {"global_step": 233565, "acc_step": 0, "speed/wps": 5510.396396442343, "speed/FLOPS": 243531315957170.62, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05072994530200958, "optim/lr": 1.9282715613643253e-05, "optim/total_tokens": 1959285227520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.277347207069397, "created_at": "2025-06-03T06:35:59.839750+00:00"} {"global_step": 233566, "acc_step": 0, "speed/wps": 5506.302986443137, "speed/FLOPS": 243350408187177.47, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.49 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.49, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043891582638025284, "optim/lr": 1.927916838854893e-05, "optim/total_tokens": 1959293616128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2759908437728882, "created_at": "2025-06-03T06:36:02.818425+00:00"} {"global_step": 233567, "acc_step": 0, "speed/wps": 5525.105724230391, "speed/FLOPS": 244181392956237.62, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04606155306100845, "optim/lr": 1.9275621163454384e-05, "optim/total_tokens": 1959302004736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2712671756744385, "created_at": "2025-06-03T06:36:05.787099+00:00"} {"global_step": 233568, "acc_step": 0, "speed/wps": 5527.071114347497, "speed/FLOPS": 244268253139635.16, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.25, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04273713752627373, "optim/lr": 1.9272073938359834e-05, "optim/total_tokens": 1959310393344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2804442644119263, "created_at": "2025-06-03T06:36:08.758581+00:00"} {"global_step": 233569, "acc_step": 0, "speed/wps": 5530.172613996255, "speed/FLOPS": 244405323549195.94, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.08, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04557187855243683, "optim/lr": 1.9268526713265287e-05, "optim/total_tokens": 1959318781952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2915115356445312, "created_at": "2025-06-03T06:36:11.727791+00:00"} {"global_step": 233570, "acc_step": 0, "speed/wps": 5518.35009256567, "speed/FLOPS": 243882828615114.4, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043852221220731735, "optim/lr": 1.9264979488170965e-05, "optim/total_tokens": 1959327170560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2780873775482178, "created_at": "2025-06-03T06:36:14.704337+00:00"} {"global_step": 233571, "acc_step": 0, "speed/wps": 5524.145020240665, "speed/FLOPS": 244138934757220.5, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046159256249666214, "optim/lr": 1.9261432263076418e-05, "optim/total_tokens": 1959335559168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2825603485107422, "created_at": "2025-06-03T06:36:17.673447+00:00"} {"global_step": 233572, "acc_step": 0, "speed/wps": 5515.30294055632, "speed/FLOPS": 243748160093039.03, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0431659072637558, "optim/lr": 1.9257885037981872e-05, "optim/total_tokens": 1959343947776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.299922227859497, "created_at": "2025-06-03T06:36:20.647624+00:00"} {"global_step": 233573, "acc_step": 0, "speed/wps": 5518.172670973199, "speed/FLOPS": 243874987488853.25, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.051829636096954346, "optim/lr": 1.9254337812887322e-05, "optim/total_tokens": 1959352336384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2839183807373047, "created_at": "2025-06-03T06:36:23.620905+00:00"} {"global_step": 233574, "acc_step": 0, "speed/wps": 5508.2451103863295, "speed/FLOPS": 243436240124775.06, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04533737897872925, "optim/lr": 1.9250790587793e-05, "optim/total_tokens": 1959360724992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2945611476898193, "created_at": "2025-06-03T06:36:26.601638+00:00"} {"global_step": 233575, "acc_step": 0, "speed/wps": 5522.111116637428, "speed/FLOPS": 244049046628419.78, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04956419765949249, "optim/lr": 1.9247243362698453e-05, "optim/total_tokens": 1959369113600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2742135524749756, "created_at": "2025-06-03T06:36:29.572067+00:00"} {"global_step": 233576, "acc_step": 0, "speed/wps": 5527.776417478913, "speed/FLOPS": 244299423927975.03, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04397166892886162, "optim/lr": 1.9243696137603906e-05, "optim/total_tokens": 1959377502208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.271329641342163, "created_at": "2025-06-03T06:36:32.543021+00:00"} {"global_step": 233577, "acc_step": 0, "speed/wps": 5520.72092995833, "speed/FLOPS": 243987607492824.16, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.054284777492284775, "optim/lr": 1.924014891250936e-05, "optim/total_tokens": 1959385890816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.286635160446167, "created_at": "2025-06-03T06:36:35.517577+00:00"} {"global_step": 233578, "acc_step": 0, "speed/wps": 5528.67528869351, "speed/FLOPS": 244339149434820.28, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.2, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044665973633527756, "optim/lr": 1.9236601687415034e-05, "optim/total_tokens": 1959394279424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2880650758743286, "created_at": "2025-06-03T06:36:38.484359+00:00"} {"global_step": 233579, "acc_step": 0, "speed/wps": 5510.349150928039, "speed/FLOPS": 243529227947262.88, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05212925747036934, "optim/lr": 1.9233054462320488e-05, "optim/total_tokens": 1959402668032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2649372816085815, "created_at": "2025-06-03T06:36:41.466235+00:00"} {"global_step": 233580, "acc_step": 0, "speed/wps": 5516.3562229642375, "speed/FLOPS": 243794709784280.88, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04394331946969032, "optim/lr": 1.922950723722594e-05, "optim/total_tokens": 1959411056640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2685166597366333, "created_at": "2025-06-03T06:36:44.446056+00:00"} {"global_step": 233581, "acc_step": 0, "speed/wps": 5507.583593294875, "speed/FLOPS": 243407004455284.2, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04790463298559189, "optim/lr": 1.9225960012131615e-05, "optim/total_tokens": 1959419445248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2808421850204468, "created_at": "2025-06-03T06:36:47.424344+00:00"} {"global_step": 233582, "acc_step": 0, "speed/wps": 5505.675119577801, "speed/FLOPS": 243322659685443.53, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.48 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.48, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04340049996972084, "optim/lr": 1.922241278703707e-05, "optim/total_tokens": 1959427833856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.294820785522461, "created_at": "2025-06-03T06:36:50.407067+00:00"} {"global_step": 233583, "acc_step": 0, "speed/wps": 5522.018913030225, "speed/FLOPS": 244044971700922.28, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04623283073306084, "optim/lr": 1.9218865561942522e-05, "optim/total_tokens": 1959436222464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2798088788986206, "created_at": "2025-06-03T06:36:53.378058+00:00"} {"global_step": 233584, "acc_step": 0, "speed/wps": 5526.059178507636, "speed/FLOPS": 244223530755070.44, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.3, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04479748755693436, "optim/lr": 1.9215318336847976e-05, "optim/total_tokens": 1959444611072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2903159856796265, "created_at": "2025-06-03T06:36:56.347394+00:00"} {"global_step": 233585, "acc_step": 0, "speed/wps": 5519.749309498415, "speed/FLOPS": 243944666841700.25, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043231301009655, "optim/lr": 1.921177111175365e-05, "optim/total_tokens": 1959452999680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.279754638671875, "created_at": "2025-06-03T06:36:59.321513+00:00"} {"global_step": 233586, "acc_step": 0, "speed/wps": 5518.89182093862, "speed/FLOPS": 243906770236381.66, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04474109038710594, "optim/lr": 1.9208223886659103e-05, "optim/total_tokens": 1959461388288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2853902578353882, "created_at": "2025-06-03T06:37:02.297230+00:00"} {"global_step": 233587, "acc_step": 0, "speed/wps": 5519.563651674793, "speed/FLOPS": 243936461716179.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05018484964966774, "optim/lr": 1.9204676661564557e-05, "optim/total_tokens": 1959469776896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2902241945266724, "created_at": "2025-06-03T06:37:05.268894+00:00"} {"global_step": 233588, "acc_step": 0, "speed/wps": 5508.161274887917, "speed/FLOPS": 243432535024854.22, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046458061784505844, "optim/lr": 1.920112943647001e-05, "optim/total_tokens": 1959478165504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2883355617523193, "created_at": "2025-06-03T06:37:08.250351+00:00"} {"global_step": 233589, "acc_step": 0, "speed/wps": 5503.127323508254, "speed/FLOPS": 243210060139972.06, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.044322896748781204, "optim/lr": 1.9197582211375684e-05, "optim/total_tokens": 1959486554112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.269612431526184, "created_at": "2025-06-03T06:37:11.235167+00:00"} {"global_step": 233590, "acc_step": 0, "speed/wps": 5500.266461491472, "speed/FLOPS": 243083624682049.5, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04761712998151779, "optim/lr": 1.9194034986281138e-05, "optim/total_tokens": 1959494942720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2786865234375, "created_at": "2025-06-03T06:37:14.218253+00:00"} {"global_step": 233591, "acc_step": 0, "speed/wps": 5505.320077614541, "speed/FLOPS": 243306968647936.97, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05065470188856125, "optim/lr": 1.919048776118659e-05, "optim/total_tokens": 1959503331328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2774068117141724, "created_at": "2025-06-03T06:37:17.198371+00:00"} {"global_step": 233592, "acc_step": 0, "speed/wps": 5535.766622449409, "speed/FLOPS": 244652550090094.47, "speed/curr_iter_time": 2.9575, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9575, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 191.9, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04533606395125389, "optim/lr": 1.9186940536092045e-05, "optim/total_tokens": 1959511719936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2768117189407349, "created_at": "2025-06-03T06:37:20.165513+00:00"} {"global_step": 233593, "acc_step": 0, "speed/wps": 5521.007931235919, "speed/FLOPS": 244000291480287.9, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04866921156644821, "optim/lr": 1.9183393310997722e-05, "optim/total_tokens": 1959520108544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.282976746559143, "created_at": "2025-06-03T06:37:23.141472+00:00"} {"global_step": 233594, "acc_step": 0, "speed/wps": 5515.9414366581805, "speed/FLOPS": 243776378352621.94, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04360998794436455, "optim/lr": 1.9179846085903176e-05, "optim/total_tokens": 1959528497152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2911444902420044, "created_at": "2025-06-03T06:37:26.115837+00:00"} {"global_step": 233595, "acc_step": 0, "speed/wps": 5535.256861973517, "speed/FLOPS": 244630021286250.66, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.05001761019229889, "optim/lr": 1.9176298860808626e-05, "optim/total_tokens": 1959536885760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2742016315460205, "created_at": "2025-06-03T06:37:29.079151+00:00"} {"global_step": 233596, "acc_step": 0, "speed/wps": 5512.4984049084605, "speed/FLOPS": 243624213972318.38, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04406113550066948, "optim/lr": 1.917275163571408e-05, "optim/total_tokens": 1959545274368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2883015871047974, "created_at": "2025-06-03T06:37:32.054670+00:00"} {"global_step": 233597, "acc_step": 0, "speed/wps": 5511.892899797371, "speed/FLOPS": 243597453745664.3, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.81, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.049886494874954224, "optim/lr": 1.9169204410619757e-05, "optim/total_tokens": 1959553662976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2908786535263062, "created_at": "2025-06-03T06:37:35.036108+00:00"} {"global_step": 233598, "acc_step": 0, "speed/wps": 5501.025968029772, "speed/FLOPS": 243117190983535.5, "speed/curr_iter_time": 2.9772, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9772, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.47 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.47, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04421740025281906, "optim/lr": 1.916565718552521e-05, "optim/total_tokens": 1959562051584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2763819694519043, "created_at": "2025-06-03T06:37:38.018824+00:00"} {"global_step": 233599, "acc_step": 0, "speed/wps": 5510.950479607471, "speed/FLOPS": 243555803597014.56, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0469597764313221, "optim/lr": 1.9162109960430664e-05, "optim/total_tokens": 1959570440192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.290287733078003, "created_at": "2025-06-03T06:37:40.998630+00:00"} {"global_step": 233600, "acc_step": 0, "speed/wps": 5518.762954645552, "speed/FLOPS": 243901075005825.5, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04530511051416397, "optim/lr": 1.9158562735336114e-05, "optim/total_tokens": 1959578828800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2600195407867432, "created_at": "2025-06-03T06:37:43.973242+00:00"} {"global_step": 233601, "acc_step": 0, "speed/wps": 5522.304037568136, "speed/FLOPS": 244057572746098.25, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.046904198825359344, "optim/lr": 1.915501551024179e-05, "optim/total_tokens": 1959587217408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2910605669021606, "created_at": "2025-06-03T06:37:46.943436+00:00"} {"global_step": 233602, "acc_step": 0, "speed/wps": 5518.64086677303, "speed/FLOPS": 243895679346762.44, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04576970264315605, "optim/lr": 1.9151468285147245e-05, "optim/total_tokens": 1959595606016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2846935987472534, "created_at": "2025-06-03T06:37:49.917634+00:00"} {"global_step": 233603, "acc_step": 0, "speed/wps": 5515.198696234485, "speed/FLOPS": 243743553027584.72, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.07472538203001022, "optim/lr": 1.91479210600527e-05, "optim/total_tokens": 1959603994624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2823795080184937, "created_at": "2025-06-03T06:37:52.894176+00:00"} {"global_step": 233604, "acc_step": 0, "speed/wps": 5512.4533563205305, "speed/FLOPS": 243622223055311.44, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04738079383969307, "optim/lr": 1.9144373834958152e-05, "optim/total_tokens": 1959612383232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.3020135164260864, "created_at": "2025-06-03T06:37:55.869589+00:00"} {"global_step": 233605, "acc_step": 0, "speed/wps": 5521.008290765859, "speed/FLOPS": 244000307369670.97, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043590154498815536, "optim/lr": 1.9140826609863826e-05, "optim/total_tokens": 1959620771840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2817020416259766, "created_at": "2025-06-03T06:37:58.840411+00:00"} {"global_step": 233606, "acc_step": 0, "speed/wps": 5497.2963713700365, "speed/FLOPS": 242952361900981.44, "speed/curr_iter_time": 2.978, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.978, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.46 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.46, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043997809290885925, "optim/lr": 1.913727938476928e-05, "optim/total_tokens": 1959629160448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.287216305732727, "created_at": "2025-06-03T06:38:01.824243+00:00"} {"global_step": 233607, "acc_step": 0, "speed/wps": 5510.071173022074, "speed/FLOPS": 243516942746639.1, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04324107617139816, "optim/lr": 1.9133732159674733e-05, "optim/total_tokens": 1959637549056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2852762937545776, "created_at": "2025-06-03T06:38:04.804875+00:00"} {"global_step": 233608, "acc_step": 0, "speed/wps": 5520.630992021071, "speed/FLOPS": 243983632696341.38, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0437234565615654, "optim/lr": 1.9130184934580407e-05, "optim/total_tokens": 1959645937664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2768044471740723, "created_at": "2025-06-03T06:38:07.778471+00:00"} {"global_step": 233609, "acc_step": 0, "speed/wps": 5526.531789176512, "speed/FLOPS": 244244417727594.06, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043468642979860306, "optim/lr": 1.912663770948586e-05, "optim/total_tokens": 1959654326272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2797229290008545, "created_at": "2025-06-03T06:38:10.747160+00:00"} {"global_step": 233610, "acc_step": 0, "speed/wps": 5519.650328451737, "speed/FLOPS": 243940292386068.0, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04310283064842224, "optim/lr": 1.9123090484391315e-05, "optim/total_tokens": 1959662714880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2789980173110962, "created_at": "2025-06-03T06:38:13.718784+00:00"} {"global_step": 233611, "acc_step": 0, "speed/wps": 5519.358745681638, "speed/FLOPS": 243927405920085.53, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.0444343127310276, "optim/lr": 1.9119543259296768e-05, "optim/total_tokens": 1959671103488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2673813104629517, "created_at": "2025-06-03T06:38:16.692745+00:00"} {"global_step": 233612, "acc_step": 0, "speed/wps": 5531.802519496237, "speed/FLOPS": 244477357029682.53, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04685352370142937, "optim/lr": 1.9115996034202442e-05, "optim/total_tokens": 1959679492096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2935912609100342, "created_at": "2025-06-03T06:38:19.662292+00:00"} {"global_step": 233613, "acc_step": 0, "speed/wps": 5506.416429722599, "speed/FLOPS": 243355421799474.3, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.045317698270082474, "optim/lr": 1.9112448809107896e-05, "optim/total_tokens": 1959687880704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2850614786148071, "created_at": "2025-06-03T06:38:22.641259+00:00"} {"global_step": 233614, "acc_step": 0, "speed/wps": 5502.126983048281, "speed/FLOPS": 243165850211847.84, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043222252279520035, "optim/lr": 1.910890158401335e-05, "optim/total_tokens": 1959696269312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.286700963973999, "created_at": "2025-06-03T06:38:25.623023+00:00"} {"global_step": 233615, "acc_step": 0, "speed/wps": 5500.160752211738, "speed/FLOPS": 243078952872954.44, "speed/curr_iter_time": 2.9777, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9777, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043638505041599274, "optim/lr": 1.9105354358918803e-05, "optim/total_tokens": 1959704657920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2789204120635986, "created_at": "2025-06-03T06:38:28.605848+00:00"} {"global_step": 233616, "acc_step": 0, "speed/wps": 5504.927409303201, "speed/FLOPS": 243289614718434.34, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04345390573143959, "optim/lr": 1.9101807133824477e-05, "optim/total_tokens": 1959713046528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2737417221069336, "created_at": "2025-06-03T06:38:31.585578+00:00"} {"global_step": 233617, "acc_step": 0, "speed/wps": 5512.572746620733, "speed/FLOPS": 243627499495485.44, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.043383821845054626, "optim/lr": 1.909825990872993e-05, "optim/total_tokens": 1959721435136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.282447099685669, "created_at": "2025-06-03T06:38:34.561450+00:00"} {"global_step": 233618, "acc_step": 0, "speed/wps": 5530.9208183195215, "speed/FLOPS": 244438390350627.44, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.16, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0432734377682209, "optim/lr": 1.9094712683635384e-05, "optim/total_tokens": 1959729823744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.277935266494751, "created_at": "2025-06-03T06:38:37.530158+00:00"} {"global_step": 233619, "acc_step": 0, "speed/wps": 5528.767455830802, "speed/FLOPS": 244343222750534.4, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.16, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04509557783603668, "optim/lr": 1.9091165458540837e-05, "optim/total_tokens": 1959738212352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2802212238311768, "created_at": "2025-06-03T06:38:40.499752+00:00"} {"global_step": 233620, "acc_step": 0, "speed/wps": 5514.761250477673, "speed/FLOPS": 243724220164183.97, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.042917877435684204, "optim/lr": 1.9087618233446515e-05, "optim/total_tokens": 1959746600960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2888277769088745, "created_at": "2025-06-03T06:38:43.474673+00:00"} {"global_step": 233621, "acc_step": 0, "speed/wps": 5519.749742902518, "speed/FLOPS": 243944685995943.25, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04706800729036331, "optim/lr": 1.9084071008351965e-05, "optim/total_tokens": 1959754989568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2917368412017822, "created_at": "2025-06-03T06:38:46.447492+00:00"} {"global_step": 233622, "acc_step": 0, "speed/wps": 5502.105662308502, "speed/FLOPS": 243164907944279.1, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.45 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.45, "speed/est_time_remaining_days": 0.19, "optim/grad_norm": 0.04316341504454613, "optim/lr": 1.908052378325742e-05, "optim/total_tokens": 1959763378176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.275526762008667, "created_at": "2025-06-03T06:38:49.428583+00:00"} {"global_step": 233623, "acc_step": 0, "speed/wps": 5514.589927035801, "speed/FLOPS": 243716648544966.12, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045284077525138855, "optim/lr": 1.9076976558162872e-05, "optim/total_tokens": 1959771766784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.271135687828064, "created_at": "2025-06-03T06:38:52.402821+00:00"} {"global_step": 233624, "acc_step": 0, "speed/wps": 5513.955137614156, "speed/FLOPS": 243688594101676.22, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04629647359251976, "optim/lr": 1.907342933306855e-05, "optim/total_tokens": 1959780155392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2904139757156372, "created_at": "2025-06-03T06:38:55.377556+00:00"} {"global_step": 233625, "acc_step": 0, "speed/wps": 5513.230201680174, "speed/FLOPS": 243656555643952.7, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.44 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.44, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04348261281847954, "optim/lr": 1.9069882107974003e-05, "optim/total_tokens": 1959788544000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2903592586517334, "created_at": "2025-06-03T06:38:58.354975+00:00"} {"global_step": 233626, "acc_step": 0, "speed/wps": 5526.231985234991, "speed/FLOPS": 244231167927914.53, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.26, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0439385287463665, "optim/lr": 1.9066334882879453e-05, "optim/total_tokens": 1959796932608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2723203897476196, "created_at": "2025-06-03T06:39:01.327342+00:00"} {"global_step": 233627, "acc_step": 0, "speed/wps": 5519.890966123055, "speed/FLOPS": 243950927339445.0, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04377494752407074, "optim/lr": 1.9062787657784907e-05, "optim/total_tokens": 1959805321216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2866389751434326, "created_at": "2025-06-03T06:39:04.299546+00:00"} {"global_step": 233628, "acc_step": 0, "speed/wps": 5518.678694375141, "speed/FLOPS": 243897351133156.53, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04387417808175087, "optim/lr": 1.9059240432690584e-05, "optim/total_tokens": 1959813709824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2826942205429077, "created_at": "2025-06-03T06:39:07.271989+00:00"} {"global_step": 233629, "acc_step": 0, "speed/wps": 5512.302182924533, "speed/FLOPS": 243615541964983.94, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.048610977828502655, "optim/lr": 1.9055693207596038e-05, "optim/total_tokens": 1959822098432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.286278486251831, "created_at": "2025-06-03T06:39:10.247749+00:00"} {"global_step": 233630, "acc_step": 0, "speed/wps": 5510.032203067547, "speed/FLOPS": 243515220474115.34, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04508887231349945, "optim/lr": 1.905214598250149e-05, "optim/total_tokens": 1959830487040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.279221773147583, "created_at": "2025-06-03T06:39:13.224717+00:00"} {"global_step": 233631, "acc_step": 0, "speed/wps": 5518.93599919116, "speed/FLOPS": 243908722689019.1, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04934694990515709, "optim/lr": 1.904859875740694e-05, "optim/total_tokens": 1959838875648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2757750749588013, "created_at": "2025-06-03T06:39:16.197754+00:00"} {"global_step": 233632, "acc_step": 0, "speed/wps": 5521.250503299583, "speed/FLOPS": 244011011923905.47, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04446783289313316, "optim/lr": 1.904505153231262e-05, "optim/total_tokens": 1959847264256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2939200401306152, "created_at": "2025-06-03T06:39:19.169249+00:00"} {"global_step": 233633, "acc_step": 0, "speed/wps": 5520.642804239778, "speed/FLOPS": 243984154735947.84, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0502251461148262, "optim/lr": 1.9041504307218072e-05, "optim/total_tokens": 1959855652864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2760504484176636, "created_at": "2025-06-03T06:39:22.140404+00:00"} {"global_step": 233634, "acc_step": 0, "speed/wps": 5509.18782477071, "speed/FLOPS": 243477903275315.06, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044162116944789886, "optim/lr": 1.9037957082123526e-05, "optim/total_tokens": 1959864041472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2854480743408203, "created_at": "2025-06-03T06:39:25.117581+00:00"} {"global_step": 233635, "acc_step": 0, "speed/wps": 5523.864717744759, "speed/FLOPS": 244126546821619.72, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.049992095679044724, "optim/lr": 1.90344098570292e-05, "optim/total_tokens": 1959872430080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2927604913711548, "created_at": "2025-06-03T06:39:28.086789+00:00"} {"global_step": 233636, "acc_step": 0, "speed/wps": 5509.802189181585, "speed/FLOPS": 243505055037673.62, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.43 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.43, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04354334995150566, "optim/lr": 1.9030862631934653e-05, "optim/total_tokens": 1959880818688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2764557600021362, "created_at": "2025-06-03T06:39:31.065307+00:00"} {"global_step": 233637, "acc_step": 0, "speed/wps": 5522.444929526097, "speed/FLOPS": 244063799449489.75, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04488489776849747, "optim/lr": 1.9027315406840107e-05, "optim/total_tokens": 1959889207296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2736226320266724, "created_at": "2025-06-03T06:39:34.036900+00:00"} {"global_step": 233638, "acc_step": 0, "speed/wps": 5518.568907815575, "speed/FLOPS": 243892499129162.22, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04387989267706871, "optim/lr": 1.902376818174556e-05, "optim/total_tokens": 1959897595904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2804903984069824, "created_at": "2025-06-03T06:39:37.012845+00:00"} {"global_step": 233639, "acc_step": 0, "speed/wps": 5517.07655619672, "speed/FLOPS": 243826544826156.88, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04502975568175316, "optim/lr": 1.9020220956651234e-05, "optim/total_tokens": 1959905984512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.293379783630371, "created_at": "2025-06-03T06:39:39.986024+00:00"} {"global_step": 233640, "acc_step": 0, "speed/wps": 5514.802683876488, "speed/FLOPS": 243726051308336.25, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04334636777639389, "optim/lr": 1.9016673731556688e-05, "optim/total_tokens": 1959914373120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2823820114135742, "created_at": "2025-06-03T06:39:42.965974+00:00"} {"global_step": 233641, "acc_step": 0, "speed/wps": 5513.742535160573, "speed/FLOPS": 243679198161425.84, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043512631207704544, "optim/lr": 1.901312650646214e-05, "optim/total_tokens": 1959922761728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2926931381225586, "created_at": "2025-06-03T06:39:45.944947+00:00"} {"global_step": 233642, "acc_step": 0, "speed/wps": 5513.285468810309, "speed/FLOPS": 243658998168221.8, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043022967875003815, "optim/lr": 1.9009579281367595e-05, "optim/total_tokens": 1959931150336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2783637046813965, "created_at": "2025-06-03T06:39:48.923904+00:00"} {"global_step": 233643, "acc_step": 0, "speed/wps": 5527.169176964573, "speed/FLOPS": 244272587005379.94, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04560968279838562, "optim/lr": 1.900603205627327e-05, "optim/total_tokens": 1959939538944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2852656841278076, "created_at": "2025-06-03T06:39:51.895353+00:00"} {"global_step": 233644, "acc_step": 0, "speed/wps": 5521.922173121328, "speed/FLOPS": 244040696292108.78, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045135289430618286, "optim/lr": 1.9002484831178723e-05, "optim/total_tokens": 1959947927552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2729636430740356, "created_at": "2025-06-03T06:39:54.866084+00:00"} {"global_step": 233645, "acc_step": 0, "speed/wps": 5526.914516322364, "speed/FLOPS": 244261332308465.6, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04488588124513626, "optim/lr": 1.8998937606084176e-05, "optim/total_tokens": 1959956316160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2972424030303955, "created_at": "2025-06-03T06:39:57.834002+00:00"} {"global_step": 233646, "acc_step": 0, "speed/wps": 5508.076932331688, "speed/FLOPS": 243428807515573.25, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04334040731191635, "optim/lr": 1.899539038098963e-05, "optim/total_tokens": 1959964704768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2883508205413818, "created_at": "2025-06-03T06:40:00.815878+00:00"} {"global_step": 233647, "acc_step": 0, "speed/wps": 5514.640705249961, "speed/FLOPS": 243718892682125.5, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04559389874339104, "optim/lr": 1.8991843155895307e-05, "optim/total_tokens": 1959973093376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2860448360443115, "created_at": "2025-06-03T06:40:03.795036+00:00"} {"global_step": 233648, "acc_step": 0, "speed/wps": 5514.2987425345345, "speed/FLOPS": 243703779680427.53, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04464751482009888, "optim/lr": 1.8988295930800757e-05, "optim/total_tokens": 1959981481984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2654426097869873, "created_at": "2025-06-03T06:40:06.771817+00:00"} {"global_step": 233649, "acc_step": 0, "speed/wps": 5505.0090477740105, "speed/FLOPS": 243293222720980.56, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.42 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.42, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04858145862817764, "optim/lr": 1.898474870570621e-05, "optim/total_tokens": 1959989870592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2707319259643555, "created_at": "2025-06-03T06:40:09.755666+00:00"} {"global_step": 233650, "acc_step": 0, "speed/wps": 5514.574643666595, "speed/FLOPS": 243715973098274.56, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045760657638311386, "optim/lr": 1.8981201480611664e-05, "optim/total_tokens": 1959998259200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3000833988189697, "created_at": "2025-06-03T06:40:12.732808+00:00"} {"global_step": 233651, "acc_step": 0, "speed/wps": 5530.05944442612, "speed/FLOPS": 244400322033450.34, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05286908894777298, "optim/lr": 1.897765425551734e-05, "optim/total_tokens": 1960006647808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2629659175872803, "created_at": "2025-06-03T06:40:15.702903+00:00"} {"global_step": 233652, "acc_step": 0, "speed/wps": 5528.313810123154, "speed/FLOPS": 244323173932225.6, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0439642108976841, "optim/lr": 1.8974107030422795e-05, "optim/total_tokens": 1960015036416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2726600170135498, "created_at": "2025-06-03T06:40:18.673561+00:00"} {"global_step": 233653, "acc_step": 0, "speed/wps": 5528.335672361289, "speed/FLOPS": 244324140131250.06, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04869140312075615, "optim/lr": 1.8970559805328245e-05, "optim/total_tokens": 1960023425024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.28525710105896, "created_at": "2025-06-03T06:40:21.645799+00:00"} {"global_step": 233654, "acc_step": 0, "speed/wps": 5523.239171235851, "speed/FLOPS": 244098900867763.25, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045267362147569656, "optim/lr": 1.89670125802337e-05, "optim/total_tokens": 1960031813632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2831978797912598, "created_at": "2025-06-03T06:40:24.619352+00:00"} {"global_step": 233655, "acc_step": 0, "speed/wps": 5520.156823836757, "speed/FLOPS": 243962676889607.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04735178500413895, "optim/lr": 1.8963465355139376e-05, "optim/total_tokens": 1960040202240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2854523658752441, "created_at": "2025-06-03T06:40:27.593795+00:00"} {"global_step": 233656, "acc_step": 0, "speed/wps": 5517.550284451812, "speed/FLOPS": 243847481190270.94, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04821353405714035, "optim/lr": 1.895991813004483e-05, "optim/total_tokens": 1960048590848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2747786045074463, "created_at": "2025-06-03T06:40:30.566978+00:00"} {"global_step": 233657, "acc_step": 0, "speed/wps": 5508.374813575377, "speed/FLOPS": 243441972341849.84, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04604196548461914, "optim/lr": 1.8956370904950284e-05, "optim/total_tokens": 1960056979456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.292292594909668, "created_at": "2025-06-03T06:40:33.548477+00:00"} {"global_step": 233658, "acc_step": 0, "speed/wps": 5504.938998952139, "speed/FLOPS": 243290126921596.2, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04730639606714249, "optim/lr": 1.8952823679855734e-05, "optim/total_tokens": 1960065368064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2763590812683105, "created_at": "2025-06-03T06:40:36.528176+00:00"} {"global_step": 233659, "acc_step": 0, "speed/wps": 5506.363938890862, "speed/FLOPS": 243353101973384.0, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.41 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.41, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04353160783648491, "optim/lr": 1.894927645476141e-05, "optim/total_tokens": 1960073756672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2911063432693481, "created_at": "2025-06-03T06:40:39.507027+00:00"} {"global_step": 233660, "acc_step": 0, "speed/wps": 5529.9539662129355, "speed/FLOPS": 244395660436314.03, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04812149703502655, "optim/lr": 1.8945729229666865e-05, "optim/total_tokens": 1960082145280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2789500951766968, "created_at": "2025-06-03T06:40:42.473514+00:00"} {"global_step": 233661, "acc_step": 0, "speed/wps": 5538.0140453660215, "speed/FLOPS": 244751874679655.44, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04434515908360481, "optim/lr": 1.8942182004572318e-05, "optim/total_tokens": 1960090533888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2941877841949463, "created_at": "2025-06-03T06:40:45.435226+00:00"} {"global_step": 233662, "acc_step": 0, "speed/wps": 5514.801921051685, "speed/FLOPS": 243726017595384.44, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.049213483929634094, "optim/lr": 1.8938634779477992e-05, "optim/total_tokens": 1960098922496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2714229822158813, "created_at": "2025-06-03T06:40:48.409862+00:00"} {"global_step": 233663, "acc_step": 0, "speed/wps": 5519.013778804175, "speed/FLOPS": 243912160149802.22, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045938290655612946, "optim/lr": 1.8935087554383446e-05, "optim/total_tokens": 1960107311104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.3015401363372803, "created_at": "2025-06-03T06:40:51.382000+00:00"} {"global_step": 233664, "acc_step": 0, "speed/wps": 5524.013655312802, "speed/FLOPS": 244133129099795.62, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04582187533378601, "optim/lr": 1.89315403292889e-05, "optim/total_tokens": 1960115699712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2992725372314453, "created_at": "2025-06-03T06:40:54.351350+00:00"} {"global_step": 233665, "acc_step": 0, "speed/wps": 5515.675257201231, "speed/FLOPS": 243764614583054.75, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04732922837138176, "optim/lr": 1.8927993104194353e-05, "optim/total_tokens": 1960124088320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2929675579071045, "created_at": "2025-06-03T06:40:57.325646+00:00"} {"global_step": 233666, "acc_step": 0, "speed/wps": 5519.765084412486, "speed/FLOPS": 243945364012158.88, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04470234364271164, "optim/lr": 1.8924445879100027e-05, "optim/total_tokens": 1960132476928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.290779948234558, "created_at": "2025-06-03T06:41:00.299112+00:00"} {"global_step": 233667, "acc_step": 0, "speed/wps": 5510.682522447745, "speed/FLOPS": 243543961262083.75, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05321316421031952, "optim/lr": 1.892089865400548e-05, "optim/total_tokens": 1960140865536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2872384786605835, "created_at": "2025-06-03T06:41:03.276468+00:00"} {"global_step": 233668, "acc_step": 0, "speed/wps": 5525.098684774893, "speed/FLOPS": 244181081848335.78, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045438848435878754, "optim/lr": 1.8917351428910934e-05, "optim/total_tokens": 1960149254144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2764776945114136, "created_at": "2025-06-03T06:41:06.248651+00:00"} {"global_step": 233669, "acc_step": 0, "speed/wps": 5529.6745834700705, "speed/FLOPS": 244383313149089.9, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05477476119995117, "optim/lr": 1.8913804203816387e-05, "optim/total_tokens": 1960157642752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2787245512008667, "created_at": "2025-06-03T06:41:09.214988+00:00"} {"global_step": 233670, "acc_step": 0, "speed/wps": 5519.572560769083, "speed/FLOPS": 243936855452545.78, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043748944997787476, "optim/lr": 1.891025697872206e-05, "optim/total_tokens": 1960166031360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2735284566879272, "created_at": "2025-06-03T06:41:12.186202+00:00"} {"global_step": 233671, "acc_step": 0, "speed/wps": 5516.9317766579925, "speed/FLOPS": 243820146311594.0, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.054286807775497437, "optim/lr": 1.8906709753627515e-05, "optim/total_tokens": 1960174419968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2952830791473389, "created_at": "2025-06-03T06:41:15.164103+00:00"} {"global_step": 233672, "acc_step": 0, "speed/wps": 5513.919335844934, "speed/FLOPS": 243687011846726.66, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04406638815999031, "optim/lr": 1.890316252853297e-05, "optim/total_tokens": 1960182808576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2863290309906006, "created_at": "2025-06-03T06:41:18.138518+00:00"} {"global_step": 233673, "acc_step": 0, "speed/wps": 5513.357506895221, "speed/FLOPS": 243662181882850.62, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0484626479446888, "optim/lr": 1.8899615303438422e-05, "optim/total_tokens": 1960191197184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2735366821289062, "created_at": "2025-06-03T06:41:21.113650+00:00"} {"global_step": 233674, "acc_step": 0, "speed/wps": 5503.272908585667, "speed/FLOPS": 243216494255221.72, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.4 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.4, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04759030416607857, "optim/lr": 1.8896068078344096e-05, "optim/total_tokens": 1960199585792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2964184284210205, "created_at": "2025-06-03T06:41:24.097642+00:00"} {"global_step": 233675, "acc_step": 0, "speed/wps": 5517.699647925588, "speed/FLOPS": 243854082291300.25, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0437164343893528, "optim/lr": 1.889252085324955e-05, "optim/total_tokens": 1960207974400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2786542177200317, "created_at": "2025-06-03T06:41:27.070149+00:00"} {"global_step": 233676, "acc_step": 0, "speed/wps": 5526.667427388329, "speed/FLOPS": 244250412242297.1, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.049274370074272156, "optim/lr": 1.8888973628155003e-05, "optim/total_tokens": 1960216363008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2885206937789917, "created_at": "2025-06-03T06:41:30.039837+00:00"} {"global_step": 233677, "acc_step": 0, "speed/wps": 5525.412280048074, "speed/FLOPS": 244194941154284.28, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0436101034283638, "optim/lr": 1.8885426403060457e-05, "optim/total_tokens": 1960224751616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.278583288192749, "created_at": "2025-06-03T06:41:33.011567+00:00"} {"global_step": 233678, "acc_step": 0, "speed/wps": 5520.654575363286, "speed/FLOPS": 243984674959356.8, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04965239390730858, "optim/lr": 1.8881879177966134e-05, "optim/total_tokens": 1960233140224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2779544591903687, "created_at": "2025-06-03T06:41:35.982496+00:00"} {"global_step": 233679, "acc_step": 0, "speed/wps": 5523.773235619386, "speed/FLOPS": 244122503779926.16, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0442175418138504, "optim/lr": 1.8878331952871584e-05, "optim/total_tokens": 1960241528832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.287082314491272, "created_at": "2025-06-03T06:41:38.951660+00:00"} {"global_step": 233680, "acc_step": 0, "speed/wps": 5535.873802365796, "speed/FLOPS": 244657286893802.25, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04814217612147331, "optim/lr": 1.8874784727777038e-05, "optim/total_tokens": 1960249917440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2914050817489624, "created_at": "2025-06-03T06:41:41.918225+00:00"} {"global_step": 233681, "acc_step": 0, "speed/wps": 5525.566338471924, "speed/FLOPS": 244201749748075.94, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04281776025891304, "optim/lr": 1.887123750268249e-05, "optim/total_tokens": 1960258306048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.284533977508545, "created_at": "2025-06-03T06:41:44.886994+00:00"} {"global_step": 233682, "acc_step": 0, "speed/wps": 5506.739589469198, "speed/FLOPS": 243369703806192.47, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04345370829105377, "optim/lr": 1.886769027758817e-05, "optim/total_tokens": 1960266694656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2773115634918213, "created_at": "2025-06-03T06:41:47.865165+00:00"} {"global_step": 233683, "acc_step": 0, "speed/wps": 5514.116049328163, "speed/FLOPS": 243695705575814.5, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043830785900354385, "optim/lr": 1.8864143052493622e-05, "optim/total_tokens": 1960275083264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2802963256835938, "created_at": "2025-06-03T06:41:50.840266+00:00"} {"global_step": 233684, "acc_step": 0, "speed/wps": 5527.018085299519, "speed/FLOPS": 244265909527141.78, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0470539852976799, "optim/lr": 1.8860595827399072e-05, "optim/total_tokens": 1960283471872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.3038333654403687, "created_at": "2025-06-03T06:41:53.808261+00:00"} {"global_step": 233685, "acc_step": 0, "speed/wps": 5523.612930884741, "speed/FLOPS": 244115419131168.9, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044036950916051865, "optim/lr": 1.8857048602304526e-05, "optim/total_tokens": 1960291860480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.286723017692566, "created_at": "2025-06-03T06:41:56.777677+00:00"} {"global_step": 233686, "acc_step": 0, "speed/wps": 5511.088472466282, "speed/FLOPS": 243561902175062.53, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.39 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.39, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0433722622692585, "optim/lr": 1.8853501377210203e-05, "optim/total_tokens": 1960300249088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.294283151626587, "created_at": "2025-06-03T06:41:59.758806+00:00"} {"global_step": 233687, "acc_step": 0, "speed/wps": 5531.764897921186, "speed/FLOPS": 244475694348629.97, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04362601041793823, "optim/lr": 1.8849954152115657e-05, "optim/total_tokens": 1960308637696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2900800704956055, "created_at": "2025-06-03T06:42:02.723966+00:00"} {"global_step": 233688, "acc_step": 0, "speed/wps": 5518.604801583393, "speed/FLOPS": 243894085449978.84, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04343229532241821, "optim/lr": 1.884640692702111e-05, "optim/total_tokens": 1960317026304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2801839113235474, "created_at": "2025-06-03T06:42:05.697434+00:00"} {"global_step": 233689, "acc_step": 0, "speed/wps": 5511.6122760992785, "speed/FLOPS": 243585051614570.94, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0451233871281147, "optim/lr": 1.8842859701926784e-05, "optim/total_tokens": 1960325414912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2848179340362549, "created_at": "2025-06-03T06:42:08.673753+00:00"} {"global_step": 233690, "acc_step": 0, "speed/wps": 5515.897681629072, "speed/FLOPS": 243774444604293.9, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04469955340027809, "optim/lr": 1.8839312476832238e-05, "optim/total_tokens": 1960333803520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2845488786697388, "created_at": "2025-06-03T06:42:11.648245+00:00"} {"global_step": 233691, "acc_step": 0, "speed/wps": 5527.05075156588, "speed/FLOPS": 244267353208913.84, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044056668877601624, "optim/lr": 1.883576525173769e-05, "optim/total_tokens": 1960342192128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.3014036417007446, "created_at": "2025-06-03T06:42:14.618398+00:00"} {"global_step": 233692, "acc_step": 0, "speed/wps": 5515.836174641314, "speed/FLOPS": 243771726310256.28, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05400466546416283, "optim/lr": 1.8832218026643145e-05, "optim/total_tokens": 1960350580736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2788597345352173, "created_at": "2025-06-03T06:42:17.593411+00:00"} {"global_step": 233693, "acc_step": 0, "speed/wps": 5525.0623659464645, "speed/FLOPS": 244179476742015.88, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04403569921851158, "optim/lr": 1.882867080154882e-05, "optim/total_tokens": 1960358969344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2922371625900269, "created_at": "2025-06-03T06:42:20.562120+00:00"} {"global_step": 233694, "acc_step": 0, "speed/wps": 5527.266730762903, "speed/FLOPS": 244276898383940.5, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05010456219315529, "optim/lr": 1.8825123576454273e-05, "optim/total_tokens": 1960367357952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3012350797653198, "created_at": "2025-06-03T06:42:23.529384+00:00"} {"global_step": 233695, "acc_step": 0, "speed/wps": 5507.10674174388, "speed/FLOPS": 243385930057477.72, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044598229229450226, "optim/lr": 1.8821576351359726e-05, "optim/total_tokens": 1960375746560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2710455656051636, "created_at": "2025-06-03T06:42:26.507458+00:00"} {"global_step": 233696, "acc_step": 0, "speed/wps": 5517.429673504519, "speed/FLOPS": 243842150803743.38, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05211792141199112, "optim/lr": 1.881802912626518e-05, "optim/total_tokens": 1960384135168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2990806102752686, "created_at": "2025-06-03T06:42:29.481014+00:00"} {"global_step": 233697, "acc_step": 0, "speed/wps": 5512.376428663158, "speed/FLOPS": 243618823246607.0, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044613420963287354, "optim/lr": 1.8814481901170854e-05, "optim/total_tokens": 1960392523776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2714399099349976, "created_at": "2025-06-03T06:42:32.459677+00:00"} {"global_step": 233698, "acc_step": 0, "speed/wps": 5525.814849423959, "speed/FLOPS": 244212732660161.53, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.051977936178445816, "optim/lr": 1.8810934676076307e-05, "optim/total_tokens": 1960400912384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2993760108947754, "created_at": "2025-06-03T06:42:35.430544+00:00"} {"global_step": 233699, "acc_step": 0, "speed/wps": 5512.538142588874, "speed/FLOPS": 243625970174396.75, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04442737251520157, "optim/lr": 1.880738745098176e-05, "optim/total_tokens": 1960409300992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2747859954833984, "created_at": "2025-06-03T06:42:38.406481+00:00"} {"global_step": 233700, "acc_step": 0, "speed/wps": 5503.732540788962, "speed/FLOPS": 243236807645996.47, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.38 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.38, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05266667529940605, "optim/lr": 1.8803840225887214e-05, "optim/total_tokens": 1960417689600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2871686220169067, "created_at": "2025-06-03T06:42:41.390203+00:00"} {"global_step": 233701, "acc_step": 0, "speed/wps": 5526.3824280421195, "speed/FLOPS": 244237816729953.53, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04398659989237785, "optim/lr": 1.880029300079289e-05, "optim/total_tokens": 1960426078208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.294297218322754, "created_at": "2025-06-03T06:42:44.361344+00:00"} {"global_step": 233702, "acc_step": 0, "speed/wps": 5529.23440528331, "speed/FLOPS": 244363859526271.28, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04528236761689186, "optim/lr": 1.8796745775698342e-05, "optim/total_tokens": 1960434466816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2941609621047974, "created_at": "2025-06-03T06:42:47.328559+00:00"} {"global_step": 233703, "acc_step": 0, "speed/wps": 5514.380660495485, "speed/FLOPS": 243707400035007.4, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04504593834280968, "optim/lr": 1.8793198550603796e-05, "optim/total_tokens": 1960442855424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2961382865905762, "created_at": "2025-06-03T06:42:50.302653+00:00"} {"global_step": 233704, "acc_step": 0, "speed/wps": 5525.896371775812, "speed/FLOPS": 244216335530844.25, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.047377824783325195, "optim/lr": 1.878965132550925e-05, "optim/total_tokens": 1960451244032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.282064437866211, "created_at": "2025-06-03T06:42:53.274824+00:00"} {"global_step": 233705, "acc_step": 0, "speed/wps": 5529.194995660849, "speed/FLOPS": 244362117822675.25, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04339437931776047, "optim/lr": 1.8786104100414926e-05, "optim/total_tokens": 1960459632640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2940170764923096, "created_at": "2025-06-03T06:42:56.241610+00:00"} {"global_step": 233706, "acc_step": 0, "speed/wps": 5534.4440753784975, "speed/FLOPS": 244594100278969.75, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.1, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04608231782913208, "optim/lr": 1.8782556875320377e-05, "optim/total_tokens": 1960468021248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3058395385742188, "created_at": "2025-06-03T06:42:59.205264+00:00"} {"global_step": 233707, "acc_step": 0, "speed/wps": 5519.107607502729, "speed/FLOPS": 243916306898019.47, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04542408138513565, "optim/lr": 1.877900965022583e-05, "optim/total_tokens": 1960476409856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2803887128829956, "created_at": "2025-06-03T06:43:02.177315+00:00"} {"global_step": 233708, "acc_step": 0, "speed/wps": 5508.744858530226, "speed/FLOPS": 243458326434792.44, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.37 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.37, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044035617262125015, "optim/lr": 1.8775462425131284e-05, "optim/total_tokens": 1960484798464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2869408130645752, "created_at": "2025-06-03T06:43:05.154659+00:00"} {"global_step": 233709, "acc_step": 0, "speed/wps": 5514.209651936554, "speed/FLOPS": 243699842332003.8, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043927956372499466, "optim/lr": 1.877191520003696e-05, "optim/total_tokens": 1960493187072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2860125303268433, "created_at": "2025-06-03T06:43:08.132869+00:00"} {"global_step": 233710, "acc_step": 0, "speed/wps": 5525.033896771417, "speed/FLOPS": 244178218550197.22, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04990606755018234, "optim/lr": 1.8768367974942415e-05, "optim/total_tokens": 1960501575680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.269200325012207, "created_at": "2025-06-03T06:43:11.102458+00:00"} {"global_step": 233711, "acc_step": 0, "speed/wps": 5523.081200649768, "speed/FLOPS": 244091919376425.16, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04300495609641075, "optim/lr": 1.8764820749847865e-05, "optim/total_tokens": 1960509964288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2768948078155518, "created_at": "2025-06-03T06:43:14.073240+00:00"} {"global_step": 233712, "acc_step": 0, "speed/wps": 5520.728767339913, "speed/FLOPS": 243987953864974.78, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04990174248814583, "optim/lr": 1.876127352475332e-05, "optim/total_tokens": 1960518352896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2818230390548706, "created_at": "2025-06-03T06:43:17.044826+00:00"} {"global_step": 233713, "acc_step": 0, "speed/wps": 5517.63134421467, "speed/FLOPS": 243851063616887.78, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04343418776988983, "optim/lr": 1.8757726299658996e-05, "optim/total_tokens": 1960526741504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2835750579833984, "created_at": "2025-06-03T06:43:20.018307+00:00"} {"global_step": 233714, "acc_step": 0, "speed/wps": 5520.1501152661995, "speed/FLOPS": 243962380405126.44, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04392084851861, "optim/lr": 1.875417907456445e-05, "optim/total_tokens": 1960535130112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.284772515296936, "created_at": "2025-06-03T06:43:22.992492+00:00"} {"global_step": 233715, "acc_step": 0, "speed/wps": 5513.316243804151, "speed/FLOPS": 243660358265428.94, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.048995573073625565, "optim/lr": 1.8750631849469903e-05, "optim/total_tokens": 1960543518720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2755143642425537, "created_at": "2025-06-03T06:43:25.972179+00:00"} {"global_step": 233716, "acc_step": 0, "speed/wps": 5528.766933263258, "speed/FLOPS": 244343199655723.7, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04651602730154991, "optim/lr": 1.8747084624375577e-05, "optim/total_tokens": 1960551907328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.278078317642212, "created_at": "2025-06-03T06:43:28.942164+00:00"} {"global_step": 233717, "acc_step": 0, "speed/wps": 5518.85778071534, "speed/FLOPS": 243905265832746.3, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046344734728336334, "optim/lr": 1.874353739928103e-05, "optim/total_tokens": 1960560295936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2657630443572998, "created_at": "2025-06-03T06:43:31.913990+00:00"} {"global_step": 233718, "acc_step": 0, "speed/wps": 5522.364848993794, "speed/FLOPS": 244060260299851.25, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04585703834891319, "optim/lr": 1.8739990174186484e-05, "optim/total_tokens": 1960568684544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2860209941864014, "created_at": "2025-06-03T06:43:34.886566+00:00"} {"global_step": 233719, "acc_step": 0, "speed/wps": 5526.16778906996, "speed/FLOPS": 244228330786005.94, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04464827850461006, "optim/lr": 1.8736442949091938e-05, "optim/total_tokens": 1960577073152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2730573415756226, "created_at": "2025-06-03T06:43:37.854366+00:00"} {"global_step": 233720, "acc_step": 0, "speed/wps": 5526.3925913275825, "speed/FLOPS": 244238265895150.56, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04450574889779091, "optim/lr": 1.873289572399761e-05, "optim/total_tokens": 1960585461760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2789316177368164, "created_at": "2025-06-03T06:43:40.824088+00:00"} {"global_step": 233721, "acc_step": 0, "speed/wps": 5518.129273012958, "speed/FLOPS": 243873069521141.47, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045560844242572784, "optim/lr": 1.8729348498903065e-05, "optim/total_tokens": 1960593850368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2846356630325317, "created_at": "2025-06-03T06:43:43.796604+00:00"} {"global_step": 233722, "acc_step": 0, "speed/wps": 5527.548526215278, "speed/FLOPS": 244289352300575.6, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04672347009181976, "optim/lr": 1.872580127380852e-05, "optim/total_tokens": 1960602238976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2832634449005127, "created_at": "2025-06-03T06:43:46.763795+00:00"} {"global_step": 233723, "acc_step": 0, "speed/wps": 5520.263602814219, "speed/FLOPS": 243967395973866.97, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04833744093775749, "optim/lr": 1.8722254048713972e-05, "optim/total_tokens": 1960610627584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2948482036590576, "created_at": "2025-06-03T06:43:49.736213+00:00"} {"global_step": 233724, "acc_step": 0, "speed/wps": 5507.8037127470325, "speed/FLOPS": 243416732608396.06, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044548533856868744, "optim/lr": 1.8718706823619646e-05, "optim/total_tokens": 1960619016192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.287973165512085, "created_at": "2025-06-03T06:43:52.719287+00:00"} {"global_step": 233725, "acc_step": 0, "speed/wps": 5505.931930950694, "speed/FLOPS": 243334009433645.62, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.36 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.36, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046847667545080185, "optim/lr": 1.87151595985251e-05, "optim/total_tokens": 1960627404800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2951676845550537, "created_at": "2025-06-03T06:43:55.698611+00:00"} {"global_step": 233726, "acc_step": 0, "speed/wps": 5534.526898117434, "speed/FLOPS": 244597760620105.53, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04316860809922218, "optim/lr": 1.8711612373430553e-05, "optim/total_tokens": 1960635793408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2849241495132446, "created_at": "2025-06-03T06:43:58.662429+00:00"} {"global_step": 233727, "acc_step": 0, "speed/wps": 5526.592484974231, "speed/FLOPS": 244247100171184.03, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043851159512996674, "optim/lr": 1.8708065148336007e-05, "optim/total_tokens": 1960644182016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2835372686386108, "created_at": "2025-06-03T06:44:01.633842+00:00"} {"global_step": 233728, "acc_step": 0, "speed/wps": 5516.106981171024, "speed/FLOPS": 243783694572756.0, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04483983665704727, "optim/lr": 1.870451792324168e-05, "optim/total_tokens": 1960652570624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2821722030639648, "created_at": "2025-06-03T06:44:04.606779+00:00"} {"global_step": 233729, "acc_step": 0, "speed/wps": 5517.037526017589, "speed/FLOPS": 243824819892013.84, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04387843236327171, "optim/lr": 1.8700970698147134e-05, "optim/total_tokens": 1960660959232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2949559688568115, "created_at": "2025-06-03T06:44:07.579950+00:00"} {"global_step": 233730, "acc_step": 0, "speed/wps": 5520.7661233047, "speed/FLOPS": 243989604807413.2, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04492850601673126, "optim/lr": 1.8697423473052588e-05, "optim/total_tokens": 1960669347840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.289107322692871, "created_at": "2025-06-03T06:44:10.551100+00:00"} {"global_step": 233731, "acc_step": 0, "speed/wps": 5520.586846396291, "speed/FLOPS": 243981681685683.9, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046264540404081345, "optim/lr": 1.869387624795804e-05, "optim/total_tokens": 1960677736448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2873681783676147, "created_at": "2025-06-03T06:44:13.522309+00:00"} {"global_step": 233732, "acc_step": 0, "speed/wps": 5517.03841619694, "speed/FLOPS": 243824859233384.8, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044191014021635056, "optim/lr": 1.8690329022863715e-05, "optim/total_tokens": 1960686125056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2738550901412964, "created_at": "2025-06-03T06:44:16.495434+00:00"} {"global_step": 233733, "acc_step": 0, "speed/wps": 5506.8888547533425, "speed/FLOPS": 243376300567742.7, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 193.08, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04485245794057846, "optim/lr": 1.868678179776917e-05, "optim/total_tokens": 1960694513664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.292359709739685, "created_at": "2025-06-03T06:44:19.476588+00:00"} {"global_step": 233734, "acc_step": 0, "speed/wps": 5505.858047398244, "speed/FLOPS": 243330744158797.66, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.35 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.35, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04297330603003502, "optim/lr": 1.8683234572674623e-05, "optim/total_tokens": 1960702902272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.3058712482452393, "created_at": "2025-06-03T06:44:22.460361+00:00"} {"global_step": 233735, "acc_step": 0, "speed/wps": 5528.543217835835, "speed/FLOPS": 244333312578910.97, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.042999956756830215, "optim/lr": 1.8679687347580076e-05, "optim/total_tokens": 1960711290880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.298069953918457, "created_at": "2025-06-03T06:44:25.427889+00:00"} {"global_step": 233736, "acc_step": 0, "speed/wps": 5528.922495949047, "speed/FLOPS": 244350074730193.56, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04470759630203247, "optim/lr": 1.8676140122485753e-05, "optim/total_tokens": 1960719679488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2848138809204102, "created_at": "2025-06-03T06:44:28.394191+00:00"} {"global_step": 233737, "acc_step": 0, "speed/wps": 5520.905769018684, "speed/FLOPS": 243995776433199.72, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04434174671769142, "optim/lr": 1.8672592897391204e-05, "optim/total_tokens": 1960728068096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2801522016525269, "created_at": "2025-06-03T06:44:31.367670+00:00"} {"global_step": 233738, "acc_step": 0, "speed/wps": 5532.399901993151, "speed/FLOPS": 244503758278365.3, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.19, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04914199188351631, "optim/lr": 1.8669045672296657e-05, "optim/total_tokens": 1960736456704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2880767583847046, "created_at": "2025-06-03T06:44:34.335570+00:00"} {"global_step": 233739, "acc_step": 0, "speed/wps": 5524.484122306258, "speed/FLOPS": 244153921332838.0, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045673683285713196, "optim/lr": 1.866549844720211e-05, "optim/total_tokens": 1960744845312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.28822922706604, "created_at": "2025-06-03T06:44:37.304675+00:00"} {"global_step": 233740, "acc_step": 0, "speed/wps": 5526.358096983914, "speed/FLOPS": 244236741421718.47, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0473758727312088, "optim/lr": 1.8661951222107788e-05, "optim/total_tokens": 1960753233920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2874244451522827, "created_at": "2025-06-03T06:44:40.272836+00:00"} {"global_step": 233741, "acc_step": 0, "speed/wps": 5518.689836482074, "speed/FLOPS": 243897843557252.47, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04838332533836365, "optim/lr": 1.865840399701324e-05, "optim/total_tokens": 1960761622528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2881380319595337, "created_at": "2025-06-03T06:44:43.245132+00:00"} {"global_step": 233742, "acc_step": 0, "speed/wps": 5512.687994467433, "speed/FLOPS": 243632592860417.62, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.34 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.34, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04662157595157623, "optim/lr": 1.8654856771918692e-05, "optim/total_tokens": 1960770011136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2943952083587646, "created_at": "2025-06-03T06:44:46.220190+00:00"} {"global_step": 233743, "acc_step": 0, "speed/wps": 5524.7516128872185, "speed/FLOPS": 244165743047375.56, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04802122339606285, "optim/lr": 1.865130954682437e-05, "optim/total_tokens": 1960778399744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2796802520751953, "created_at": "2025-06-03T06:44:49.189328+00:00"} {"global_step": 233744, "acc_step": 0, "speed/wps": 5527.49872226814, "speed/FLOPS": 244287151221031.8, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.31, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04673287644982338, "optim/lr": 1.8647762321729823e-05, "optim/total_tokens": 1960786788352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2820338010787964, "created_at": "2025-06-03T06:44:52.158013+00:00"} {"global_step": 233745, "acc_step": 0, "speed/wps": 5524.611817229122, "speed/FLOPS": 244159564794826.72, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04368218407034874, "optim/lr": 1.8644215096635276e-05, "optim/total_tokens": 1960795176960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2693955898284912, "created_at": "2025-06-03T06:44:55.126952+00:00"} {"global_step": 233746, "acc_step": 0, "speed/wps": 5523.3723726546, "speed/FLOPS": 244104787688685.3, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04487869143486023, "optim/lr": 1.864066787154073e-05, "optim/total_tokens": 1960803565568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2771015167236328, "created_at": "2025-06-03T06:44:58.096862+00:00"} {"global_step": 233747, "acc_step": 0, "speed/wps": 5538.625367081092, "speed/FLOPS": 244778891970433.38, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04492815211415291, "optim/lr": 1.8637120646446404e-05, "optim/total_tokens": 1960811954176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2880654335021973, "created_at": "2025-06-03T06:45:01.059533+00:00"} {"global_step": 233748, "acc_step": 0, "speed/wps": 5520.1892522886355, "speed/FLOPS": 243964110061196.66, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.047832220792770386, "optim/lr": 1.8633573421351857e-05, "optim/total_tokens": 1960820342784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2714282274246216, "created_at": "2025-06-03T06:45:04.033657+00:00"} {"global_step": 233749, "acc_step": 0, "speed/wps": 5514.1402398697255, "speed/FLOPS": 243696774673933.16, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04634398594498634, "optim/lr": 1.863002619625731e-05, "optim/total_tokens": 1960828731392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2787387371063232, "created_at": "2025-06-03T06:45:07.008335+00:00"} {"global_step": 233750, "acc_step": 0, "speed/wps": 5520.531201947773, "speed/FLOPS": 243979222485873.53, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04562753811478615, "optim/lr": 1.8626478971162765e-05, "optim/total_tokens": 1960837120000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2818611860275269, "created_at": "2025-06-03T06:45:09.981025+00:00"} {"global_step": 233751, "acc_step": 0, "speed/wps": 5512.625283342382, "speed/FLOPS": 243629821349675.03, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046526242047548294, "optim/lr": 1.862293174606844e-05, "optim/total_tokens": 1960845508608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2812877893447876, "created_at": "2025-06-03T06:45:12.957005+00:00"} {"global_step": 233752, "acc_step": 0, "speed/wps": 5538.870094433634, "speed/FLOPS": 244789707666787.6, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 191.99, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04373125731945038, "optim/lr": 1.8619384520973892e-05, "optim/total_tokens": 1960853897216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2828269004821777, "created_at": "2025-06-03T06:45:15.918285+00:00"} {"global_step": 233753, "acc_step": 0, "speed/wps": 5534.279646035986, "speed/FLOPS": 244586833343656.4, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045741498470306396, "optim/lr": 1.8615837295879346e-05, "optim/total_tokens": 1960862285824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2849743366241455, "created_at": "2025-06-03T06:45:18.883918+00:00"} {"global_step": 233754, "acc_step": 0, "speed/wps": 5525.891597182233, "speed/FLOPS": 244216124518246.62, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04534213989973068, "optim/lr": 1.86122900707848e-05, "optim/total_tokens": 1960870674432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.3075765371322632, "created_at": "2025-06-03T06:45:21.852165+00:00"} {"global_step": 233755, "acc_step": 0, "speed/wps": 5526.886300232235, "speed/FLOPS": 244260085301704.97, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046652667224407196, "optim/lr": 1.8608742845690473e-05, "optim/total_tokens": 1960879063040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2871203422546387, "created_at": "2025-06-03T06:45:24.819703+00:00"} {"global_step": 233756, "acc_step": 0, "speed/wps": 5515.5408704454785, "speed/FLOPS": 243758675376304.25, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.33 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.33, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044259704649448395, "optim/lr": 1.8605195620595927e-05, "optim/total_tokens": 1960887451648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2881674766540527, "created_at": "2025-06-03T06:45:27.798541+00:00"} {"global_step": 233757, "acc_step": 0, "speed/wps": 5517.388849091273, "speed/FLOPS": 243840346573636.2, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.67, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04376479238271713, "optim/lr": 1.860164839550138e-05, "optim/total_tokens": 1960895840256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2768120765686035, "created_at": "2025-06-03T06:45:30.773504+00:00"} {"global_step": 233758, "acc_step": 0, "speed/wps": 5523.15855743085, "speed/FLOPS": 244095338150201.06, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04625609144568443, "optim/lr": 1.8598101170406834e-05, "optim/total_tokens": 1960904228864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2832601070404053, "created_at": "2025-06-03T06:45:33.743187+00:00"} {"global_step": 233759, "acc_step": 0, "speed/wps": 5524.493657529787, "speed/FLOPS": 244154342740912.28, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0438997820019722, "optim/lr": 1.8594553945312508e-05, "optim/total_tokens": 1960912617472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2700272798538208, "created_at": "2025-06-03T06:45:36.712410+00:00"} {"global_step": 233760, "acc_step": 0, "speed/wps": 5523.399240539475, "speed/FLOPS": 244105975111674.47, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04618635028600693, "optim/lr": 1.859100672021796e-05, "optim/total_tokens": 1960921006080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.287902593612671, "created_at": "2025-06-03T06:45:39.682163+00:00"} {"global_step": 233761, "acc_step": 0, "speed/wps": 5520.981264207797, "speed/FLOPS": 243999112934139.1, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04458371922373772, "optim/lr": 1.8587459495123415e-05, "optim/total_tokens": 1960929394688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2960911989212036, "created_at": "2025-06-03T06:45:42.656715+00:00"} {"global_step": 233762, "acc_step": 0, "speed/wps": 5523.577690802571, "speed/FLOPS": 244113861699912.06, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045235056430101395, "optim/lr": 1.858391227002887e-05, "optim/total_tokens": 1960937783296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.270668387413025, "created_at": "2025-06-03T06:45:45.627298+00:00"} {"global_step": 233763, "acc_step": 0, "speed/wps": 5527.641723944909, "speed/FLOPS": 244293471163196.1, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043382685631513596, "optim/lr": 1.8580365044934546e-05, "optim/total_tokens": 1960946171904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.277857780456543, "created_at": "2025-06-03T06:45:48.598276+00:00"} {"global_step": 233764, "acc_step": 0, "speed/wps": 5514.457387843506, "speed/FLOPS": 243710790991063.75, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0433725081384182, "optim/lr": 1.8576817819839996e-05, "optim/total_tokens": 1960954560512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2782752513885498, "created_at": "2025-06-03T06:45:51.572731+00:00"} {"global_step": 233765, "acc_step": 0, "speed/wps": 5513.780063638007, "speed/FLOPS": 243680856728040.25, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04347563534975052, "optim/lr": 1.857327059474545e-05, "optim/total_tokens": 1960962949120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.274834156036377, "created_at": "2025-06-03T06:45:54.549011+00:00"} {"global_step": 233766, "acc_step": 0, "speed/wps": 5512.113213590589, "speed/FLOPS": 243607190487656.34, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046750083565711975, "optim/lr": 1.8569723369650903e-05, "optim/total_tokens": 1960971337728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2697746753692627, "created_at": "2025-06-03T06:45:57.524746+00:00"} {"global_step": 233767, "acc_step": 0, "speed/wps": 5510.73875224236, "speed/FLOPS": 243546446331195.53, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04456133767962456, "optim/lr": 1.856617614455658e-05, "optim/total_tokens": 1960979726336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2860071659088135, "created_at": "2025-06-03T06:46:00.500920+00:00"} {"global_step": 233768, "acc_step": 0, "speed/wps": 5524.97562886295, "speed/FLOPS": 244175643406885.16, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044526033103466034, "optim/lr": 1.8562628919462034e-05, "optim/total_tokens": 1960988114944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2785388231277466, "created_at": "2025-06-03T06:46:03.470319+00:00"} {"global_step": 233769, "acc_step": 0, "speed/wps": 5536.209681570625, "speed/FLOPS": 244672131035470.06, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.09, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04386354237794876, "optim/lr": 1.8559081694367484e-05, "optim/total_tokens": 1960996503552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2903205156326294, "created_at": "2025-06-03T06:46:06.433786+00:00"} {"global_step": 233770, "acc_step": 0, "speed/wps": 5519.842250041399, "speed/FLOPS": 243948774337987.3, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.67, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04372784495353699, "optim/lr": 1.8555534469272938e-05, "optim/total_tokens": 1961004892160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.276196002960205, "created_at": "2025-06-03T06:46:09.405406+00:00"} {"global_step": 233771, "acc_step": 0, "speed/wps": 5522.585447700648, "speed/FLOPS": 244070009633567.66, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04331139102578163, "optim/lr": 1.8551987244178615e-05, "optim/total_tokens": 1961013280768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2808150053024292, "created_at": "2025-06-03T06:46:12.375925+00:00"} {"global_step": 233772, "acc_step": 0, "speed/wps": 5522.381629143972, "speed/FLOPS": 244061001896600.5, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04675380513072014, "optim/lr": 1.854844001908407e-05, "optim/total_tokens": 1961021669376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2720147371292114, "created_at": "2025-06-03T06:46:15.347755+00:00"} {"global_step": 233773, "acc_step": 0, "speed/wps": 5517.788299254059, "speed/FLOPS": 243858000226260.06, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04323020949959755, "optim/lr": 1.8544892793989522e-05, "optim/total_tokens": 1961030057984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2838525772094727, "created_at": "2025-06-03T06:46:18.320774+00:00"} {"global_step": 233774, "acc_step": 0, "speed/wps": 5523.949615181042, "speed/FLOPS": 244130298853758.94, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.42, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04526390880346298, "optim/lr": 1.8541345568895196e-05, "optim/total_tokens": 1961038446592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2852503061294556, "created_at": "2025-06-03T06:46:21.291944+00:00"} {"global_step": 233775, "acc_step": 0, "speed/wps": 5509.653373751421, "speed/FLOPS": 243498478157366.78, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.31 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.31, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043776482343673706, "optim/lr": 1.853779834380065e-05, "optim/total_tokens": 1961046835200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.302485466003418, "created_at": "2025-06-03T06:46:24.270306+00:00"} {"global_step": 233776, "acc_step": 0, "speed/wps": 5506.714762696256, "speed/FLOPS": 243368606589903.38, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.32 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.32, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045196402817964554, "optim/lr": 1.8534251118706103e-05, "optim/total_tokens": 1961055223808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2900679111480713, "created_at": "2025-06-03T06:46:27.249269+00:00"} {"global_step": 233777, "acc_step": 0, "speed/wps": 5518.573420911002, "speed/FLOPS": 243892698584880.0, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0457550548017025, "optim/lr": 1.8530703893611557e-05, "optim/total_tokens": 1961063612416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.280813217163086, "created_at": "2025-06-03T06:46:30.224427+00:00"} {"global_step": 233778, "acc_step": 0, "speed/wps": 5521.195175135368, "speed/FLOPS": 244008566702242.38, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0454011894762516, "optim/lr": 1.852715666851723e-05, "optim/total_tokens": 1961072001024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2715973854064941, "created_at": "2025-06-03T06:46:33.196051+00:00"} {"global_step": 233779, "acc_step": 0, "speed/wps": 5532.823880221971, "speed/FLOPS": 244522495945961.88, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04409666359424591, "optim/lr": 1.8523609443422684e-05, "optim/total_tokens": 1961080389632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2750186920166016, "created_at": "2025-06-03T06:46:36.160755+00:00"} {"global_step": 233780, "acc_step": 0, "speed/wps": 5530.722468462685, "speed/FLOPS": 244429624302201.88, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04818602278828621, "optim/lr": 1.8520062218328138e-05, "optim/total_tokens": 1961088778240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2794369459152222, "created_at": "2025-06-03T06:46:39.127746+00:00"} {"global_step": 233781, "acc_step": 0, "speed/wps": 5528.038968805391, "speed/FLOPS": 244311027352745.84, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.27, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04527100548148155, "optim/lr": 1.851651499323359e-05, "optim/total_tokens": 1961097166848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2838549613952637, "created_at": "2025-06-03T06:46:42.098157+00:00"} {"global_step": 233782, "acc_step": 0, "speed/wps": 5522.524576807291, "speed/FLOPS": 244067319451646.75, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044347863644361496, "optim/lr": 1.8512967768139265e-05, "optim/total_tokens": 1961105555456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2842235565185547, "created_at": "2025-06-03T06:46:45.068247+00:00"} {"global_step": 233783, "acc_step": 0, "speed/wps": 5523.153722541454, "speed/FLOPS": 244095124472836.97, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044369813054800034, "optim/lr": 1.850942054304472e-05, "optim/total_tokens": 1961113944064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2873331308364868, "created_at": "2025-06-03T06:46:48.039448+00:00"} {"global_step": 233784, "acc_step": 0, "speed/wps": 5517.879530891791, "speed/FLOPS": 243862032197681.94, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.67, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0434301421046257, "optim/lr": 1.8505873317950173e-05, "optim/total_tokens": 1961122332672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2936762571334839, "created_at": "2025-06-03T06:46:51.013014+00:00"} {"global_step": 233785, "acc_step": 0, "speed/wps": 5522.644197451045, "speed/FLOPS": 244072606071826.75, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.3 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.3, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04357420653104782, "optim/lr": 1.8502326092855626e-05, "optim/total_tokens": 1961130721280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2870882749557495, "created_at": "2025-06-03T06:46:53.988480+00:00"} {"global_step": 233786, "acc_step": 0, "speed/wps": 5536.247943362856, "speed/FLOPS": 244673822010845.06, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04421968013048172, "optim/lr": 1.84987788677613e-05, "optim/total_tokens": 1961139109888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2775084972381592, "created_at": "2025-06-03T06:46:56.955428+00:00"} {"global_step": 233787, "acc_step": 0, "speed/wps": 5524.4331214548265, "speed/FLOPS": 244151667356250.75, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043722525238990784, "optim/lr": 1.8495231642666754e-05, "optim/total_tokens": 1961147498496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2803434133529663, "created_at": "2025-06-03T06:46:59.924989+00:00"} {"global_step": 233788, "acc_step": 0, "speed/wps": 5530.944723541487, "speed/FLOPS": 244439446839080.3, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.24, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0434199757874012, "optim/lr": 1.8491684417572207e-05, "optim/total_tokens": 1961155887104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2621709108352661, "created_at": "2025-06-03T06:47:02.890730+00:00"} {"global_step": 233789, "acc_step": 0, "speed/wps": 5528.9067099186195, "speed/FLOPS": 244349377068448.9, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04704538732767105, "optim/lr": 1.848813719247766e-05, "optim/total_tokens": 1961164275712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2753756046295166, "created_at": "2025-06-03T06:47:05.857679+00:00"} {"global_step": 233790, "acc_step": 0, "speed/wps": 5519.035268442688, "speed/FLOPS": 243913109881830.56, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043428801000118256, "optim/lr": 1.8484589967383335e-05, "optim/total_tokens": 1961172664320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2855480909347534, "created_at": "2025-06-03T06:47:08.832599+00:00"} {"global_step": 233791, "acc_step": 0, "speed/wps": 5527.1492185062425, "speed/FLOPS": 244271704943678.38, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04402872174978256, "optim/lr": 1.8481042742288788e-05, "optim/total_tokens": 1961181052928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2763885259628296, "created_at": "2025-06-03T06:47:11.804366+00:00"} {"global_step": 233792, "acc_step": 0, "speed/wps": 5521.86269085102, "speed/FLOPS": 244038067480219.0, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0449833907186985, "optim/lr": 1.8477495517194242e-05, "optim/total_tokens": 1961189441536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2926915884017944, "created_at": "2025-06-03T06:47:14.774943+00:00"} {"global_step": 233793, "acc_step": 0, "speed/wps": 5522.551214971829, "speed/FLOPS": 244068496722172.84, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043522708117961884, "optim/lr": 1.8473948292099695e-05, "optim/total_tokens": 1961197830144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2716035842895508, "created_at": "2025-06-03T06:47:17.745411+00:00"} {"global_step": 233794, "acc_step": 0, "speed/wps": 5523.661534476048, "speed/FLOPS": 244117567161128.9, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04691820964217186, "optim/lr": 1.8470401067005373e-05, "optim/total_tokens": 1961206218752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2691782712936401, "created_at": "2025-06-03T06:47:20.719283+00:00"} {"global_step": 233795, "acc_step": 0, "speed/wps": 5527.600099570656, "speed/FLOPS": 244291631578906.97, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.43, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04327401891350746, "optim/lr": 1.8466853841910823e-05, "optim/total_tokens": 1961214607360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2984910011291504, "created_at": "2025-06-03T06:47:23.686880+00:00"} {"global_step": 233796, "acc_step": 0, "speed/wps": 5520.990852751378, "speed/FLOPS": 243999536698686.78, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046997833997011185, "optim/lr": 1.8463306616816277e-05, "optim/total_tokens": 1961222995968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2950376272201538, "created_at": "2025-06-03T06:47:26.657908+00:00"} {"global_step": 233797, "acc_step": 0, "speed/wps": 5524.014026075326, "speed/FLOPS": 244133145485601.44, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04470726102590561, "optim/lr": 1.845975939172173e-05, "optim/total_tokens": 1961231384576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.288785696029663, "created_at": "2025-06-03T06:47:29.627936+00:00"} {"global_step": 233798, "acc_step": 0, "speed/wps": 5524.472986282457, "speed/FLOPS": 244153429177585.34, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05660286173224449, "optim/lr": 1.8456212166627407e-05, "optim/total_tokens": 1961239773184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2653003931045532, "created_at": "2025-06-03T06:47:32.600196+00:00"} {"global_step": 233799, "acc_step": 0, "speed/wps": 5517.694537905831, "speed/FLOPS": 243853856454582.44, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.29 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.29, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04447272792458534, "optim/lr": 1.845266494153286e-05, "optim/total_tokens": 1961248161792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2816671133041382, "created_at": "2025-06-03T06:47:35.573291+00:00"} {"global_step": 233800, "acc_step": 0, "speed/wps": 5521.703220993867, "speed/FLOPS": 244031019728773.6, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0508468933403492, "optim/lr": 1.844911771643831e-05, "optim/total_tokens": 1961256550400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.3004987239837646, "created_at": "2025-06-03T06:47:38.543746+00:00"} {"global_step": 233801, "acc_step": 0, "speed/wps": 5521.801091491686, "speed/FLOPS": 244035345103830.56, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04544380307197571, "optim/lr": 1.844557049134399e-05, "optim/total_tokens": 1961264939008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2826379537582397, "created_at": "2025-06-03T06:47:41.517581+00:00"} {"global_step": 233802, "acc_step": 0, "speed/wps": 5533.92237026937, "speed/FLOPS": 244571043583475.12, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.21, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044798385351896286, "optim/lr": 1.8442023266249442e-05, "optim/total_tokens": 1961273327616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.288549542427063, "created_at": "2025-06-03T06:47:44.481734+00:00"} {"global_step": 233803, "acc_step": 0, "speed/wps": 5519.747171054989, "speed/FLOPS": 243944572333446.38, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044030167162418365, "optim/lr": 1.8438476041154896e-05, "optim/total_tokens": 1961281716224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2815715074539185, "created_at": "2025-06-03T06:47:47.456862+00:00"} {"global_step": 233804, "acc_step": 0, "speed/wps": 5526.619124634514, "speed/FLOPS": 244248277507814.38, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04443272203207016, "optim/lr": 1.843492881606035e-05, "optim/total_tokens": 1961290104832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2936722040176392, "created_at": "2025-06-03T06:47:50.425088+00:00"} {"global_step": 233805, "acc_step": 0, "speed/wps": 5523.955544648071, "speed/FLOPS": 244130560905851.84, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04390864446759224, "optim/lr": 1.8431381590966023e-05, "optim/total_tokens": 1961298493440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.286172866821289, "created_at": "2025-06-03T06:47:53.398403+00:00"} {"global_step": 233806, "acc_step": 0, "speed/wps": 5518.905467877059, "speed/FLOPS": 243907373361209.28, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04504399001598358, "optim/lr": 1.8427834365871477e-05, "optim/total_tokens": 1961306882048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2692794799804688, "created_at": "2025-06-03T06:47:56.373457+00:00"} {"global_step": 233807, "acc_step": 0, "speed/wps": 5513.594996794663, "speed/FLOPS": 243672677720822.4, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043118879199028015, "optim/lr": 1.842428714077693e-05, "optim/total_tokens": 1961315270656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.28215491771698, "created_at": "2025-06-03T06:47:59.348475+00:00"} {"global_step": 233808, "acc_step": 0, "speed/wps": 5514.226193300782, "speed/FLOPS": 243700573375636.3, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045177049934864044, "optim/lr": 1.8420739915682384e-05, "optim/total_tokens": 1961323659264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2798041105270386, "created_at": "2025-06-03T06:48:02.323396+00:00"} {"global_step": 233809, "acc_step": 0, "speed/wps": 5513.700594510697, "speed/FLOPS": 243677344599373.0, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04371672123670578, "optim/lr": 1.8417192690588058e-05, "optim/total_tokens": 1961332047872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2973650693893433, "created_at": "2025-06-03T06:48:05.299554+00:00"} {"global_step": 233810, "acc_step": 0, "speed/wps": 5540.951114010551, "speed/FLOPS": 244881678080463.5, "speed/curr_iter_time": 2.9558, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9558, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 191.97, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044939540326595306, "optim/lr": 1.841364546549351e-05, "optim/total_tokens": 1961340436480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2938628196716309, "created_at": "2025-06-03T06:48:08.263167+00:00"} {"global_step": 233811, "acc_step": 0, "speed/wps": 5528.2790533555135, "speed/FLOPS": 244321637860997.16, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045348092913627625, "optim/lr": 1.8410098240398965e-05, "optim/total_tokens": 1961348825088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2684857845306396, "created_at": "2025-06-03T06:48:11.234311+00:00"} {"global_step": 233812, "acc_step": 0, "speed/wps": 5528.719969048873, "speed/FLOPS": 244341124077832.53, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04356546327471733, "optim/lr": 1.840655101530442e-05, "optim/total_tokens": 1961357213696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.312611699104309, "created_at": "2025-06-03T06:48:14.202443+00:00"} {"global_step": 233813, "acc_step": 0, "speed/wps": 5525.626735806971, "speed/FLOPS": 244204419001143.44, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0438440702855587, "optim/lr": 1.8403003790210092e-05, "optim/total_tokens": 1961365602304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2829395532608032, "created_at": "2025-06-03T06:48:17.175316+00:00"} {"global_step": 233814, "acc_step": 0, "speed/wps": 5520.739441720503, "speed/FLOPS": 243988425617960.4, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04321820288896561, "optim/lr": 1.8399456565115546e-05, "optim/total_tokens": 1961373990912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.293251395225525, "created_at": "2025-06-03T06:48:20.146584+00:00"} {"global_step": 233815, "acc_step": 0, "speed/wps": 5516.267053331575, "speed/FLOPS": 243790768942928.75, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04357895627617836, "optim/lr": 1.8395909340021e-05, "optim/total_tokens": 1961382379520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2793406248092651, "created_at": "2025-06-03T06:48:23.124211+00:00"} {"global_step": 233816, "acc_step": 0, "speed/wps": 5520.234007347826, "speed/FLOPS": 243966088005735.75, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0436725988984108, "optim/lr": 1.8392362114926453e-05, "optim/total_tokens": 1961390768128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2953650951385498, "created_at": "2025-06-03T06:48:26.098757+00:00"} {"global_step": 233817, "acc_step": 0, "speed/wps": 5510.159212209699, "speed/FLOPS": 243520833628106.72, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04544439911842346, "optim/lr": 1.8388814889832127e-05, "optim/total_tokens": 1961399156736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2880687713623047, "created_at": "2025-06-03T06:48:29.081605+00:00"} {"global_step": 233818, "acc_step": 0, "speed/wps": 5512.367489671036, "speed/FLOPS": 243618428188909.16, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04353409633040428, "optim/lr": 1.838526766473758e-05, "optim/total_tokens": 1961407545344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2774455547332764, "created_at": "2025-06-03T06:48:32.061075+00:00"} {"global_step": 233819, "acc_step": 0, "speed/wps": 5519.446059347429, "speed/FLOPS": 243931264737201.62, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04378041625022888, "optim/lr": 1.8381720439643034e-05, "optim/total_tokens": 1961415933952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2849842309951782, "created_at": "2025-06-03T06:48:35.035537+00:00"} {"global_step": 233820, "acc_step": 0, "speed/wps": 5522.681255568786, "speed/FLOPS": 244074243850950.22, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0462118498980999, "optim/lr": 1.8378173214548488e-05, "optim/total_tokens": 1961424322560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2793424129486084, "created_at": "2025-06-03T06:48:38.010055+00:00"} {"global_step": 233821, "acc_step": 0, "speed/wps": 5513.313418339133, "speed/FLOPS": 243660233394337.2, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04573880508542061, "optim/lr": 1.8374625989454165e-05, "optim/total_tokens": 1961432711168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2890931367874146, "created_at": "2025-06-03T06:48:40.985887+00:00"} {"global_step": 233822, "acc_step": 0, "speed/wps": 5526.332294430446, "speed/FLOPS": 244235601080924.66, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04579184576869011, "optim/lr": 1.8371078764359615e-05, "optim/total_tokens": 1961441099776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2791900634765625, "created_at": "2025-06-03T06:48:43.957263+00:00"} {"global_step": 233823, "acc_step": 0, "speed/wps": 5520.161388029764, "speed/FLOPS": 243962878603576.72, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05254415050148964, "optim/lr": 1.836753153926507e-05, "optim/total_tokens": 1961449488384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2799668312072754, "created_at": "2025-06-03T06:48:46.929184+00:00"} {"global_step": 233824, "acc_step": 0, "speed/wps": 5523.923146514616, "speed/FLOPS": 244129129074181.8, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04371701553463936, "optim/lr": 1.8363984314170522e-05, "optim/total_tokens": 1961457876992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2748814821243286, "created_at": "2025-06-03T06:48:49.902347+00:00"} {"global_step": 233825, "acc_step": 0, "speed/wps": 5523.000053505695, "speed/FLOPS": 244088333088005.88, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.048927195370197296, "optim/lr": 1.83604370890762e-05, "optim/total_tokens": 1961466265600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.275199294090271, "created_at": "2025-06-03T06:48:52.874029+00:00"} {"global_step": 233826, "acc_step": 0, "speed/wps": 5517.043517215639, "speed/FLOPS": 243825084672301.97, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04424426704645157, "optim/lr": 1.8356889863981653e-05, "optim/total_tokens": 1961474654208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2856463193893433, "created_at": "2025-06-03T06:48:55.847650+00:00"} {"global_step": 233827, "acc_step": 0, "speed/wps": 5507.323057222666, "speed/FLOPS": 243395490094437.06, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04651542752981186, "optim/lr": 1.8353342638887104e-05, "optim/total_tokens": 1961483042816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2674118280410767, "created_at": "2025-06-03T06:48:58.829274+00:00"} {"global_step": 233828, "acc_step": 0, "speed/wps": 5523.000965550348, "speed/FLOPS": 244088373395711.25, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045197077095508575, "optim/lr": 1.834979541379278e-05, "optim/total_tokens": 1961491431424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2887619733810425, "created_at": "2025-06-03T06:49:01.803513+00:00"} {"global_step": 233829, "acc_step": 0, "speed/wps": 5525.7374984915505, "speed/FLOPS": 244209314144867.06, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0458415150642395, "optim/lr": 1.8346248188698234e-05, "optim/total_tokens": 1961499820032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2709311246871948, "created_at": "2025-06-03T06:49:04.774962+00:00"} {"global_step": 233830, "acc_step": 0, "speed/wps": 5522.61379152852, "speed/FLOPS": 244071262285682.75, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04307854175567627, "optim/lr": 1.8342700963603688e-05, "optim/total_tokens": 1961508208640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2878679037094116, "created_at": "2025-06-03T06:49:07.746249+00:00"} {"global_step": 233831, "acc_step": 0, "speed/wps": 5533.6472643149455, "speed/FLOPS": 244558885308409.5, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04286753013730049, "optim/lr": 1.833915373850914e-05, "optim/total_tokens": 1961516597248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2761313915252686, "created_at": "2025-06-03T06:49:10.714651+00:00"} {"global_step": 233832, "acc_step": 0, "speed/wps": 5506.099793215127, "speed/FLOPS": 243341428086536.62, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04404847323894501, "optim/lr": 1.8335606513414815e-05, "optim/total_tokens": 1961524985856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.273439645767212, "created_at": "2025-06-03T06:49:13.694098+00:00"} {"global_step": 233833, "acc_step": 0, "speed/wps": 5501.868113663361, "speed/FLOPS": 243154409510048.03, "speed/curr_iter_time": 2.9768, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9768, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04592255502939224, "optim/lr": 1.833205928832027e-05, "optim/total_tokens": 1961533374464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.266554594039917, "created_at": "2025-06-03T06:49:16.676143+00:00"} {"global_step": 233834, "acc_step": 0, "speed/wps": 5494.229335558419, "speed/FLOPS": 242816814616620.3, "speed/curr_iter_time": 2.981, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.981, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "4.28 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 4.28, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04377232491970062, "optim/lr": 1.8328512063225723e-05, "optim/total_tokens": 1961541763072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.278991460800171, "created_at": "2025-06-03T06:49:19.661774+00:00"} {"global_step": 233835, "acc_step": 0, "speed/wps": 5504.491602523076, "speed/FLOPS": 243270354289414.12, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044850483536720276, "optim/lr": 1.8324964838131176e-05, "optim/total_tokens": 1961550151680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.288580060005188, "created_at": "2025-06-03T06:49:22.646355+00:00"} {"global_step": 233836, "acc_step": 0, "speed/wps": 5507.363008682406, "speed/FLOPS": 243397255744467.47, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.27 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.27, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043356504291296005, "optim/lr": 1.832141761303685e-05, "optim/total_tokens": 1961558540288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2719508409500122, "created_at": "2025-06-03T06:49:25.625160+00:00"} {"global_step": 233837, "acc_step": 0, "speed/wps": 5522.74134625538, "speed/FLOPS": 244076899551725.7, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04861026629805565, "optim/lr": 1.8317870387942304e-05, "optim/total_tokens": 1961566928896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.295186161994934, "created_at": "2025-06-03T06:49:28.595165+00:00"} {"global_step": 233838, "acc_step": 0, "speed/wps": 5516.082884496022, "speed/FLOPS": 243782629623058.88, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04412667825818062, "optim/lr": 1.8314323162847757e-05, "optim/total_tokens": 1961575317504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.289216160774231, "created_at": "2025-06-03T06:49:31.568673+00:00"} {"global_step": 233839, "acc_step": 0, "speed/wps": 5517.151866672613, "speed/FLOPS": 243829873163717.4, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04513516277074814, "optim/lr": 1.831077593775321e-05, "optim/total_tokens": 1961583706112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2896854877471924, "created_at": "2025-06-03T06:49:34.544501+00:00"} {"global_step": 233840, "acc_step": 0, "speed/wps": 5516.647330714211, "speed/FLOPS": 243807575256805.2, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043488625437021255, "optim/lr": 1.8307228712658885e-05, "optim/total_tokens": 1961592094720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.290406346321106, "created_at": "2025-06-03T06:49:37.518040+00:00"} {"global_step": 233841, "acc_step": 0, "speed/wps": 5512.386595770979, "speed/FLOPS": 243619272580732.72, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045963890850543976, "optim/lr": 1.8303681487564338e-05, "optim/total_tokens": 1961600483328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2893779277801514, "created_at": "2025-06-03T06:49:40.493521+00:00"} {"global_step": 233842, "acc_step": 0, "speed/wps": 5511.842713564728, "speed/FLOPS": 243595235771057.94, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0436357781291008, "optim/lr": 1.8300134262469792e-05, "optim/total_tokens": 1961608871936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2937345504760742, "created_at": "2025-06-03T06:49:43.471057+00:00"} {"global_step": 233843, "acc_step": 0, "speed/wps": 5520.259665510202, "speed/FLOPS": 243967221965182.34, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04622586444020271, "optim/lr": 1.8296587037375246e-05, "optim/total_tokens": 1961617260544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2801536321640015, "created_at": "2025-06-03T06:49:46.442943+00:00"} {"global_step": 233844, "acc_step": 0, "speed/wps": 5523.906628877075, "speed/FLOPS": 244128399079147.44, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04307728260755539, "optim/lr": 1.829303981228092e-05, "optim/total_tokens": 1961625649152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2601433992385864, "created_at": "2025-06-03T06:49:49.412101+00:00"} {"global_step": 233845, "acc_step": 0, "speed/wps": 5522.33613588366, "speed/FLOPS": 244058991327350.34, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04719111695885658, "optim/lr": 1.8289492587186373e-05, "optim/total_tokens": 1961634037760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2780156135559082, "created_at": "2025-06-03T06:49:52.385835+00:00"} {"global_step": 233846, "acc_step": 0, "speed/wps": 5521.82683875094, "speed/FLOPS": 244036483000903.16, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043768104165792465, "optim/lr": 1.8285945362091827e-05, "optim/total_tokens": 1961642426368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2837226390838623, "created_at": "2025-06-03T06:49:55.356521+00:00"} {"global_step": 233847, "acc_step": 0, "speed/wps": 5513.745307061724, "speed/FLOPS": 243679320665268.84, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04577413946390152, "optim/lr": 1.828239813699728e-05, "optim/total_tokens": 1961650814976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2798594236373901, "created_at": "2025-06-03T06:49:58.331572+00:00"} {"global_step": 233848, "acc_step": 0, "speed/wps": 5507.405958581303, "speed/FLOPS": 243399153910161.22, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04310956969857216, "optim/lr": 1.8278850911902954e-05, "optim/total_tokens": 1961659203584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.260182499885559, "created_at": "2025-06-03T06:50:01.315191+00:00"} {"global_step": 233849, "acc_step": 0, "speed/wps": 5509.73593717566, "speed/FLOPS": 243502127038120.25, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.047997623682022095, "optim/lr": 1.8275303686808408e-05, "optim/total_tokens": 1961667592192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2791290283203125, "created_at": "2025-06-03T06:50:04.292678+00:00"} {"global_step": 233850, "acc_step": 0, "speed/wps": 5505.934461937877, "speed/FLOPS": 243334121290324.38, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.26 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.26, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0452084094285965, "optim/lr": 1.827175646171386e-05, "optim/total_tokens": 1961675980800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.280636191368103, "created_at": "2025-06-03T06:50:07.272828+00:00"} {"global_step": 233851, "acc_step": 0, "speed/wps": 5514.025496878888, "speed/FLOPS": 243691703621045.97, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.047508757561445236, "optim/lr": 1.8268209236619315e-05, "optim/total_tokens": 1961684369408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2912471294403076, "created_at": "2025-06-03T06:50:10.247975+00:00"} {"global_step": 233852, "acc_step": 0, "speed/wps": 5525.028744960951, "speed/FLOPS": 244177990866544.0, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04576520994305611, "optim/lr": 1.8264662011524992e-05, "optim/total_tokens": 1961692758016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2831629514694214, "created_at": "2025-06-03T06:50:13.219506+00:00"} {"global_step": 233853, "acc_step": 0, "speed/wps": 5526.855325374317, "speed/FLOPS": 244258716371528.66, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043804995715618134, "optim/lr": 1.8261114786430442e-05, "optim/total_tokens": 1961701146624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2832729816436768, "created_at": "2025-06-03T06:50:16.190570+00:00"} {"global_step": 233854, "acc_step": 0, "speed/wps": 5515.285965647553, "speed/FLOPS": 243747409888956.97, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043791577219963074, "optim/lr": 1.8257567561335896e-05, "optim/total_tokens": 1961709535232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2936534881591797, "created_at": "2025-06-03T06:50:19.168868+00:00"} {"global_step": 233855, "acc_step": 0, "speed/wps": 5516.076069077149, "speed/FLOPS": 243782328416429.2, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044337548315525055, "optim/lr": 1.8254020336241573e-05, "optim/total_tokens": 1961717923840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2851539850234985, "created_at": "2025-06-03T06:50:22.144006+00:00"} {"global_step": 233856, "acc_step": 0, "speed/wps": 5523.207954159671, "speed/FLOPS": 244097521232779.6, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04407668113708496, "optim/lr": 1.8250473111147027e-05, "optim/total_tokens": 1961726312448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2915840148925781, "created_at": "2025-06-03T06:50:25.118494+00:00"} {"global_step": 233857, "acc_step": 0, "speed/wps": 5508.11375079951, "speed/FLOPS": 243430434703396.97, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.25 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.25, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04639957472681999, "optim/lr": 1.824692588605248e-05, "optim/total_tokens": 1961734701056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.285301923751831, "created_at": "2025-06-03T06:50:28.097245+00:00"} {"global_step": 233858, "acc_step": 0, "speed/wps": 5512.718898830139, "speed/FLOPS": 243633958675066.34, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044834740459918976, "optim/lr": 1.824337866095793e-05, "optim/total_tokens": 1961743089664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.272524118423462, "created_at": "2025-06-03T06:50:31.073035+00:00"} {"global_step": 233859, "acc_step": 0, "speed/wps": 5517.9390692996685, "speed/FLOPS": 243864663490564.94, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05190394073724747, "optim/lr": 1.8239831435863608e-05, "optim/total_tokens": 1961751478272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2696876525878906, "created_at": "2025-06-03T06:50:34.045899+00:00"} {"global_step": 233860, "acc_step": 0, "speed/wps": 5520.499336391345, "speed/FLOPS": 243977814191382.12, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044929105788469315, "optim/lr": 1.823628421076906e-05, "optim/total_tokens": 1961759866880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2853217124938965, "created_at": "2025-06-03T06:50:37.017265+00:00"} {"global_step": 233861, "acc_step": 0, "speed/wps": 5516.609085069241, "speed/FLOPS": 243805884995056.44, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05105350911617279, "optim/lr": 1.8232736985674515e-05, "optim/total_tokens": 1961768255488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2762545347213745, "created_at": "2025-06-03T06:50:39.991112+00:00"} {"global_step": 233862, "acc_step": 0, "speed/wps": 5518.41437683604, "speed/FLOPS": 243885669650828.06, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043192725628614426, "optim/lr": 1.822918976057997e-05, "optim/total_tokens": 1961776644096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2973827123641968, "created_at": "2025-06-03T06:50:42.963506+00:00"} {"global_step": 233863, "acc_step": 0, "speed/wps": 5526.375847988993, "speed/FLOPS": 244237525925285.1, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04601825028657913, "optim/lr": 1.8225642535485642e-05, "optim/total_tokens": 1961785032704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2704377174377441, "created_at": "2025-06-03T06:50:45.935064+00:00"} {"global_step": 233864, "acc_step": 0, "speed/wps": 5514.7824040455735, "speed/FLOPS": 243725155043611.4, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04618334770202637, "optim/lr": 1.8222095310391096e-05, "optim/total_tokens": 1961793421312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.261676549911499, "created_at": "2025-06-03T06:50:48.910216+00:00"} {"global_step": 233865, "acc_step": 0, "speed/wps": 5522.240368157895, "speed/FLOPS": 244054758884055.22, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.050870124250650406, "optim/lr": 1.821854808529655e-05, "optim/total_tokens": 1961801809920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2822545766830444, "created_at": "2025-06-03T06:50:51.885010+00:00"} {"global_step": 233866, "acc_step": 0, "speed/wps": 5505.632620537812, "speed/FLOPS": 243320781445405.84, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04418974369764328, "optim/lr": 1.8215000860202003e-05, "optim/total_tokens": 1961810198528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2856676578521729, "created_at": "2025-06-03T06:50:54.866394+00:00"} {"global_step": 233867, "acc_step": 0, "speed/wps": 5513.740280400768, "speed/FLOPS": 243679098512583.38, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.24 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.24, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.046000149101018906, "optim/lr": 1.8211453635107677e-05, "optim/total_tokens": 1961818587136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2962929010391235, "created_at": "2025-06-03T06:50:57.841060+00:00"} {"global_step": 233868, "acc_step": 0, "speed/wps": 5519.52316020798, "speed/FLOPS": 243934672200600.03, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05201094225049019, "optim/lr": 1.820790641001313e-05, "optim/total_tokens": 1961826975744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2836523056030273, "created_at": "2025-06-03T06:51:00.813188+00:00"} {"global_step": 233869, "acc_step": 0, "speed/wps": 5523.787806439746, "speed/FLOPS": 244123147735605.9, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04822419956326485, "optim/lr": 1.8204359184918584e-05, "optim/total_tokens": 1961835364352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2837274074554443, "created_at": "2025-06-03T06:51:03.783692+00:00"} {"global_step": 233870, "acc_step": 0, "speed/wps": 5532.43945779202, "speed/FLOPS": 244505506442210.4, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04960894212126732, "optim/lr": 1.8200811959824038e-05, "optim/total_tokens": 1961843752960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2843892574310303, "created_at": "2025-06-03T06:51:06.748830+00:00"} {"global_step": 233871, "acc_step": 0, "speed/wps": 5516.028876590224, "speed/FLOPS": 243780242750060.12, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045828912407159805, "optim/lr": 1.819726473472971e-05, "optim/total_tokens": 1961852141568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.29901123046875, "created_at": "2025-06-03T06:51:09.726928+00:00"} {"global_step": 233872, "acc_step": 0, "speed/wps": 5514.820903134428, "speed/FLOPS": 243726856506282.56, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.048124127089977264, "optim/lr": 1.8193717509635165e-05, "optim/total_tokens": 1961860530176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.304890513420105, "created_at": "2025-06-03T06:51:12.701838+00:00"} {"global_step": 233873, "acc_step": 0, "speed/wps": 5515.868985576403, "speed/FLOPS": 243773176385645.62, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0440322570502758, "optim/lr": 1.819017028454062e-05, "optim/total_tokens": 1961868918784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2775661945343018, "created_at": "2025-06-03T06:51:15.675938+00:00"} {"global_step": 233874, "acc_step": 0, "speed/wps": 5518.824162917265, "speed/FLOPS": 243903780098142.9, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05705270543694496, "optim/lr": 1.8186623059446073e-05, "optim/total_tokens": 1961877307392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2759039402008057, "created_at": "2025-06-03T06:51:18.648428+00:00"} {"global_step": 233875, "acc_step": 0, "speed/wps": 5512.6195539387045, "speed/FLOPS": 243629568139358.22, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04292672500014305, "optim/lr": 1.8183075834351746e-05, "optim/total_tokens": 1961885696000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2896660566329956, "created_at": "2025-06-03T06:51:21.626799+00:00"} {"global_step": 233876, "acc_step": 0, "speed/wps": 5516.931103642648, "speed/FLOPS": 243820116567760.56, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0490901917219162, "optim/lr": 1.81795286092572e-05, "optim/total_tokens": 1961894084608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2802040576934814, "created_at": "2025-06-03T06:51:24.600435+00:00"} {"global_step": 233877, "acc_step": 0, "speed/wps": 5506.874613852745, "speed/FLOPS": 243375671192827.8, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04381510242819786, "optim/lr": 1.8175981384162654e-05, "optim/total_tokens": 1961902473216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.3066648244857788, "created_at": "2025-06-03T06:51:27.579551+00:00"} {"global_step": 233878, "acc_step": 0, "speed/wps": 5524.700823103476, "speed/FLOPS": 244163498398899.8, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04362400248646736, "optim/lr": 1.8172434159068107e-05, "optim/total_tokens": 1961910861824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2753156423568726, "created_at": "2025-06-03T06:51:30.550116+00:00"} {"global_step": 233879, "acc_step": 0, "speed/wps": 5513.221324710984, "speed/FLOPS": 243656163327350.94, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.054137080907821655, "optim/lr": 1.8168886933973784e-05, "optim/total_tokens": 1961919250432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.282090663909912, "created_at": "2025-06-03T06:51:33.524976+00:00"} {"global_step": 233880, "acc_step": 0, "speed/wps": 5523.768715749534, "speed/FLOPS": 244122304024813.5, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044668130576610565, "optim/lr": 1.8165339708879235e-05, "optim/total_tokens": 1961927639040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2817821502685547, "created_at": "2025-06-03T06:51:36.500711+00:00"} {"global_step": 233881, "acc_step": 0, "speed/wps": 5507.749718115058, "speed/FLOPS": 243414346322032.4, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.23 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.23, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04855789616703987, "optim/lr": 1.8161792483784688e-05, "optim/total_tokens": 1961936027648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2528704404830933, "created_at": "2025-06-03T06:51:39.480249+00:00"} {"global_step": 233882, "acc_step": 0, "speed/wps": 5525.391827097327, "speed/FLOPS": 244194037238548.97, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.043449509888887405, "optim/lr": 1.8158245258690365e-05, "optim/total_tokens": 1961944416256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2790417671203613, "created_at": "2025-06-03T06:51:42.449333+00:00"} {"global_step": 233883, "acc_step": 0, "speed/wps": 5521.812246210318, "speed/FLOPS": 244035838085299.1, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05184681713581085, "optim/lr": 1.815469803359582e-05, "optim/total_tokens": 1961952804864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2811567783355713, "created_at": "2025-06-03T06:51:45.422323+00:00"} {"global_step": 233884, "acc_step": 0, "speed/wps": 5508.900861170109, "speed/FLOPS": 243465220952981.38, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04364049434661865, "optim/lr": 1.8151150808501273e-05, "optim/total_tokens": 1961961193472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2954978942871094, "created_at": "2025-06-03T06:51:48.400647+00:00"} {"global_step": 233885, "acc_step": 0, "speed/wps": 5513.413273783979, "speed/FLOPS": 243664646493892.88, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.048092328011989594, "optim/lr": 1.8147603583406723e-05, "optim/total_tokens": 1961969582080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2968143224716187, "created_at": "2025-06-03T06:51:51.377474+00:00"} {"global_step": 233886, "acc_step": 0, "speed/wps": 5516.881410823235, "speed/FLOPS": 243817920399493.4, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04340971261262894, "optim/lr": 1.81440563583124e-05, "optim/total_tokens": 1961977970688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2722119092941284, "created_at": "2025-06-03T06:51:54.351008+00:00"} {"global_step": 233887, "acc_step": 0, "speed/wps": 5520.5180991599345, "speed/FLOPS": 243978643409717.22, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04463083669543266, "optim/lr": 1.8140509133217854e-05, "optim/total_tokens": 1961986359296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2979910373687744, "created_at": "2025-06-03T06:51:57.323205+00:00"} {"global_step": 233888, "acc_step": 0, "speed/wps": 5528.513210805176, "speed/FLOPS": 244331986421745.75, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04438168928027153, "optim/lr": 1.8136961908123307e-05, "optim/total_tokens": 1961994747904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.293288230895996, "created_at": "2025-06-03T06:52:00.290242+00:00"} {"global_step": 233889, "acc_step": 0, "speed/wps": 5524.5055535100255, "speed/FLOPS": 244154868482349.7, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04413623362779617, "optim/lr": 1.813341468302876e-05, "optim/total_tokens": 1962003136512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2828487157821655, "created_at": "2025-06-03T06:52:03.263945+00:00"} {"global_step": 233890, "acc_step": 0, "speed/wps": 5514.685706185633, "speed/FLOPS": 243720881493146.53, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04353436455130577, "optim/lr": 1.8129867457934435e-05, "optim/total_tokens": 1962011525120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2736330032348633, "created_at": "2025-06-03T06:52:06.239240+00:00"} {"global_step": 233891, "acc_step": 0, "speed/wps": 5532.558149896677, "speed/FLOPS": 244510752025714.97, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.0428386889398098, "optim/lr": 1.812632023283989e-05, "optim/total_tokens": 1962019913728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.284198522567749, "created_at": "2025-06-03T06:52:09.208287+00:00"} {"global_step": 233892, "acc_step": 0, "speed/wps": 5513.741684927114, "speed/FLOPS": 243679160585458.84, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045421913266181946, "optim/lr": 1.8122773007745342e-05, "optim/total_tokens": 1962028302336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2857850790023804, "created_at": "2025-06-03T06:52:12.186745+00:00"} {"global_step": 233893, "acc_step": 0, "speed/wps": 5516.467432071904, "speed/FLOPS": 243799624657619.94, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04357585683465004, "optim/lr": 1.8119225782650796e-05, "optim/total_tokens": 1962036690944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2818810939788818, "created_at": "2025-06-03T06:52:15.160496+00:00"} {"global_step": 233894, "acc_step": 0, "speed/wps": 5526.097803526313, "speed/FLOPS": 244225237783195.22, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04375467449426651, "optim/lr": 1.811567855755647e-05, "optim/total_tokens": 1962045079552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2822593450546265, "created_at": "2025-06-03T06:52:18.130780+00:00"} {"global_step": 233895, "acc_step": 0, "speed/wps": 5528.613338306675, "speed/FLOPS": 244336411544813.0, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04347090423107147, "optim/lr": 1.8112131332461923e-05, "optim/total_tokens": 1962053468160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2865513563156128, "created_at": "2025-06-03T06:52:21.097796+00:00"} {"global_step": 233896, "acc_step": 0, "speed/wps": 5522.739745126201, "speed/FLOPS": 244076828790011.3, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.67, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.045899417251348495, "optim/lr": 1.8108584107367377e-05, "optim/total_tokens": 1962061856768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2728549242019653, "created_at": "2025-06-03T06:52:24.068023+00:00"} {"global_step": 233897, "acc_step": 0, "speed/wps": 5506.2649991322605, "speed/FLOPS": 243348729342473.4, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.22 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.22, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04356750473380089, "optim/lr": 1.810503688227283e-05, "optim/total_tokens": 1962070245376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.265380620956421, "created_at": "2025-06-03T06:52:27.051426+00:00"} {"global_step": 233898, "acc_step": 0, "speed/wps": 5514.731270127367, "speed/FLOPS": 243722895186153.78, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.05398070439696312, "optim/lr": 1.8101489657178504e-05, "optim/total_tokens": 1962078633984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2886719703674316, "created_at": "2025-06-03T06:52:30.026605+00:00"} {"global_step": 233899, "acc_step": 0, "speed/wps": 5521.457483327797, "speed/FLOPS": 244020159381732.66, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04480423405766487, "optim/lr": 1.8097942432083958e-05, "optim/total_tokens": 1962087022592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2849667072296143, "created_at": "2025-06-03T06:52:32.997462+00:00"} {"global_step": 233900, "acc_step": 0, "speed/wps": 5524.598753183869, "speed/FLOPS": 244158987430894.4, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04927191883325577, "optim/lr": 1.809439520698941e-05, "optim/total_tokens": 1962095411200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2745040655136108, "created_at": "2025-06-03T06:52:35.971704+00:00"} {"global_step": 233901, "acc_step": 0, "speed/wps": 5504.440796183903, "speed/FLOPS": 243268108909273.12, "speed/curr_iter_time": 2.9754, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9754, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04393242672085762, "optim/lr": 1.8090847981894865e-05, "optim/total_tokens": 1962103799808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.292820692062378, "created_at": "2025-06-03T06:52:38.957013+00:00"} {"global_step": 233902, "acc_step": 0, "speed/wps": 5502.6642777307125, "speed/FLOPS": 243189595886687.84, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04791288822889328, "optim/lr": 1.808730075680054e-05, "optim/total_tokens": 1962112188416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2919890880584717, "created_at": "2025-06-03T06:52:41.939856+00:00"} {"global_step": 233903, "acc_step": 0, "speed/wps": 5522.276088250588, "speed/FLOPS": 244056337529320.22, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043808020651340485, "optim/lr": 1.8083753531705992e-05, "optim/total_tokens": 1962120577024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.286255955696106, "created_at": "2025-06-03T06:52:44.914705+00:00"} {"global_step": 233904, "acc_step": 0, "speed/wps": 5524.35003023301, "speed/FLOPS": 244147995149545.9, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.06262222677469254, "optim/lr": 1.8080206306611446e-05, "optim/total_tokens": 1962128965632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2879211902618408, "created_at": "2025-06-03T06:52:47.886590+00:00"} {"global_step": 233905, "acc_step": 0, "speed/wps": 5527.570556080627, "speed/FLOPS": 244290325907864.97, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045086245983839035, "optim/lr": 1.80766590815169e-05, "optim/total_tokens": 1962137354240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2816828489303589, "created_at": "2025-06-03T06:52:50.859602+00:00"} {"global_step": 233906, "acc_step": 0, "speed/wps": 5514.454080236013, "speed/FLOPS": 243710644811742.44, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.050271760672330856, "optim/lr": 1.8073111856422573e-05, "optim/total_tokens": 1962145742848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2884372472763062, "created_at": "2025-06-03T06:52:53.834550+00:00"} {"global_step": 233907, "acc_step": 0, "speed/wps": 5528.768287682084, "speed/FLOPS": 244343259514103.25, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04677693545818329, "optim/lr": 1.8069564631328027e-05, "optim/total_tokens": 1962154131456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.297420859336853, "created_at": "2025-06-03T06:52:56.805188+00:00"} {"global_step": 233908, "acc_step": 0, "speed/wps": 5527.98368342121, "speed/FLOPS": 244308584021741.3, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.047604240477085114, "optim/lr": 1.806601740623348e-05, "optim/total_tokens": 1962162520064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2907025814056396, "created_at": "2025-06-03T06:52:59.775435+00:00"} {"global_step": 233909, "acc_step": 0, "speed/wps": 5509.695104452324, "speed/FLOPS": 243500322440749.6, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04719790071249008, "optim/lr": 1.8062470181139158e-05, "optim/total_tokens": 1962170908672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2986246347427368, "created_at": "2025-06-03T06:53:02.756752+00:00"} {"global_step": 233910, "acc_step": 0, "speed/wps": 5505.4629104843025, "speed/FLOPS": 243313281129695.53, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.21 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.21, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.044794611632823944, "optim/lr": 1.805892295604461e-05, "optim/total_tokens": 1962179297280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.277443766593933, "created_at": "2025-06-03T06:53:05.736120+00:00"} {"global_step": 233911, "acc_step": 0, "speed/wps": 5511.386262557196, "speed/FLOPS": 243575062972853.06, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0023, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.049340296536684036, "optim/lr": 1.805537573095006e-05, "optim/total_tokens": 1962187685888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2728509902954102, "created_at": "2025-06-03T06:53:08.714130+00:00"} {"global_step": 233912, "acc_step": 0, "speed/wps": 5520.947481057444, "speed/FLOPS": 243997619891811.34, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04490870237350464, "optim/lr": 1.8051828505855515e-05, "optim/total_tokens": 1962196074496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2756798267364502, "created_at": "2025-06-03T06:53:11.685401+00:00"} {"global_step": 233913, "acc_step": 0, "speed/wps": 5527.857430596723, "speed/FLOPS": 244303004293119.53, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 192.43, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04825626686215401, "optim/lr": 1.8048281280761192e-05, "optim/total_tokens": 1962204463104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2856184244155884, "created_at": "2025-06-03T06:53:14.654048+00:00"} {"global_step": 233914, "acc_step": 0, "speed/wps": 5520.282252685381, "speed/FLOPS": 243968220202713.62, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04452531412243843, "optim/lr": 1.8044734055666646e-05, "optim/total_tokens": 1962212851712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2776291370391846, "created_at": "2025-06-03T06:53:17.625709+00:00"} {"global_step": 233915, "acc_step": 0, "speed/wps": 5519.955174583604, "speed/FLOPS": 243953765024752.6, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0450081042945385, "optim/lr": 1.80411868305721e-05, "optim/total_tokens": 1962221240320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2882163524627686, "created_at": "2025-06-03T06:53:20.602613+00:00"} {"global_step": 233916, "acc_step": 0, "speed/wps": 5515.062088529183, "speed/FLOPS": 243737515666231.97, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04624316468834877, "optim/lr": 1.8037639605477553e-05, "optim/total_tokens": 1962229628928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2834054231643677, "created_at": "2025-06-03T06:53:23.579595+00:00"} {"global_step": 233917, "acc_step": 0, "speed/wps": 5502.218166900957, "speed/FLOPS": 243169880071414.88, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04357035085558891, "optim/lr": 1.8034092380383227e-05, "optim/total_tokens": 1962238017536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.290865421295166, "created_at": "2025-06-03T06:53:26.564265+00:00"} {"global_step": 233918, "acc_step": 0, "speed/wps": 5511.035435021647, "speed/FLOPS": 243559558191479.9, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04541381821036339, "optim/lr": 1.803054515528868e-05, "optim/total_tokens": 1962246406144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2817593812942505, "created_at": "2025-06-03T06:53:29.540923+00:00"} {"global_step": 233919, "acc_step": 0, "speed/wps": 5500.537078066982, "speed/FLOPS": 243095584549545.84, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.2 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.2, "speed/est_time_remaining_days": 0.18, "optim/grad_norm": 0.04491914436221123, "optim/lr": 1.8026997930194134e-05, "optim/total_tokens": 1962254794752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2936257123947144, "created_at": "2025-06-03T06:53:32.526218+00:00"} {"global_step": 233920, "acc_step": 0, "speed/wps": 5519.492632354491, "speed/FLOPS": 243933323025731.56, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04439501464366913, "optim/lr": 1.8023450705099588e-05, "optim/total_tokens": 1962263183360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2874270677566528, "created_at": "2025-06-03T06:53:35.502619+00:00"} {"global_step": 233921, "acc_step": 0, "speed/wps": 5516.529682709122, "speed/FLOPS": 243802375817157.34, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04339129850268364, "optim/lr": 1.8019903480005262e-05, "optim/total_tokens": 1962271571968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2621533870697021, "created_at": "2025-06-03T06:53:38.475970+00:00"} {"global_step": 233922, "acc_step": 0, "speed/wps": 5512.709344179937, "speed/FLOPS": 243633536408432.56, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04405338689684868, "optim/lr": 1.8016356254910715e-05, "optim/total_tokens": 1962279960576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2739309072494507, "created_at": "2025-06-03T06:53:41.451913+00:00"} {"global_step": 233923, "acc_step": 0, "speed/wps": 5515.947354998781, "speed/FLOPS": 243776639912983.66, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0447695218026638, "optim/lr": 1.801280902981617e-05, "optim/total_tokens": 1962288349184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.273084282875061, "created_at": "2025-06-03T06:53:44.428685+00:00"} {"global_step": 233924, "acc_step": 0, "speed/wps": 5509.911063757687, "speed/FLOPS": 243509866736666.72, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04551272094249725, "optim/lr": 1.8009261804721623e-05, "optim/total_tokens": 1962296737792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.290734052658081, "created_at": "2025-06-03T06:53:47.409876+00:00"} {"global_step": 233925, "acc_step": 0, "speed/wps": 5519.878182457835, "speed/FLOPS": 243950362366875.0, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045297883450984955, "optim/lr": 1.8005714579627296e-05, "optim/total_tokens": 1962305126400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.287571907043457, "created_at": "2025-06-03T06:53:50.383592+00:00"} {"global_step": 233926, "acc_step": 0, "speed/wps": 5512.388639560654, "speed/FLOPS": 243619362905775.3, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043275658041238785, "optim/lr": 1.800216735453275e-05, "optim/total_tokens": 1962313515008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2905939817428589, "created_at": "2025-06-03T06:53:53.365557+00:00"} {"global_step": 233927, "acc_step": 0, "speed/wps": 5504.670887984334, "speed/FLOPS": 243278277789135.56, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04431469738483429, "optim/lr": 1.7998620129438204e-05, "optim/total_tokens": 1962321903616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2790573835372925, "created_at": "2025-06-03T06:53:56.347239+00:00"} {"global_step": 233928, "acc_step": 0, "speed/wps": 5513.818032876149, "speed/FLOPS": 243682534774021.97, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04329164698719978, "optim/lr": 1.7995072904343657e-05, "optim/total_tokens": 1962330292224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2956064939498901, "created_at": "2025-06-03T06:53:59.322642+00:00"} {"global_step": 233929, "acc_step": 0, "speed/wps": 5533.028047445969, "speed/FLOPS": 244531519092239.97, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.28, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04364125430583954, "optim/lr": 1.799152567924933e-05, "optim/total_tokens": 1962338680832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.3000822067260742, "created_at": "2025-06-03T06:54:02.287026+00:00"} {"global_step": 233930, "acc_step": 0, "speed/wps": 5520.615107778496, "speed/FLOPS": 243982930694122.5, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04437262937426567, "optim/lr": 1.7987978454154785e-05, "optim/total_tokens": 1962347069440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2730296850204468, "created_at": "2025-06-03T06:54:05.258552+00:00"} {"global_step": 233931, "acc_step": 0, "speed/wps": 5532.874006829347, "speed/FLOPS": 244524711285436.66, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.34, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04398493468761444, "optim/lr": 1.7984431229060238e-05, "optim/total_tokens": 1962355458048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2703685760498047, "created_at": "2025-06-03T06:54:08.224342+00:00"} {"global_step": 233932, "acc_step": 0, "speed/wps": 5522.0802693808755, "speed/FLOPS": 244047683337570.75, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04659087210893631, "optim/lr": 1.7980884003965692e-05, "optim/total_tokens": 1962363846656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2725584506988525, "created_at": "2025-06-03T06:54:11.197786+00:00"} {"global_step": 233933, "acc_step": 0, "speed/wps": 5517.611527261307, "speed/FLOPS": 243850187808981.5, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04308890178799629, "optim/lr": 1.7977336778871366e-05, "optim/total_tokens": 1962372235264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2765389680862427, "created_at": "2025-06-03T06:54:14.170622+00:00"} {"global_step": 233934, "acc_step": 0, "speed/wps": 5516.568092889969, "speed/FLOPS": 243804073350549.62, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04666563868522644, "optim/lr": 1.797378955377682e-05, "optim/total_tokens": 1962380623872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2859691381454468, "created_at": "2025-06-03T06:54:17.144335+00:00"} {"global_step": 233935, "acc_step": 0, "speed/wps": 5504.916713296016, "speed/FLOPS": 243289142009663.88, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.19 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.19, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04636591300368309, "optim/lr": 1.7970242328682273e-05, "optim/total_tokens": 1962389012480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2776721715927124, "created_at": "2025-06-03T06:54:20.123961+00:00"} {"global_step": 233936, "acc_step": 0, "speed/wps": 5512.970511068137, "speed/FLOPS": 243645078648117.7, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04978640750050545, "optim/lr": 1.796669510358795e-05, "optim/total_tokens": 1962397401088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2871211767196655, "created_at": "2025-06-03T06:54:23.099526+00:00"} {"global_step": 233937, "acc_step": 0, "speed/wps": 5527.409191612565, "speed/FLOPS": 244283194424314.84, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046488504856824875, "optim/lr": 1.7963147878493404e-05, "optim/total_tokens": 1962405789696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2961193323135376, "created_at": "2025-06-03T06:54:26.070074+00:00"} {"global_step": 233938, "acc_step": 0, "speed/wps": 5525.791641573687, "speed/FLOPS": 244211706991968.1, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046742573380470276, "optim/lr": 1.7959600653398854e-05, "optim/total_tokens": 1962414178304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.271948218345642, "created_at": "2025-06-03T06:54:29.038780+00:00"} {"global_step": 233939, "acc_step": 0, "speed/wps": 5521.1178971672, "speed/FLOPS": 244005151411593.8, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04464494436979294, "optim/lr": 1.7956053428304308e-05, "optim/total_tokens": 1962422566912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2981579303741455, "created_at": "2025-06-03T06:54:32.009635+00:00"} {"global_step": 233940, "acc_step": 0, "speed/wps": 5510.703815200226, "speed/FLOPS": 243544902292757.22, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04548472911119461, "optim/lr": 1.7952506203209985e-05, "optim/total_tokens": 1962430955520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2853432893753052, "created_at": "2025-06-03T06:54:34.990567+00:00"} {"global_step": 233941, "acc_step": 0, "speed/wps": 5518.177293332588, "speed/FLOPS": 243875191773478.88, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04505284130573273, "optim/lr": 1.794895897811544e-05, "optim/total_tokens": 1962439344128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2835997343063354, "created_at": "2025-06-03T06:54:37.966428+00:00"} {"global_step": 233942, "acc_step": 0, "speed/wps": 5516.537537602954, "speed/FLOPS": 243802722963259.72, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04448457062244415, "optim/lr": 1.7945411753020892e-05, "optim/total_tokens": 1962447732736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.3023444414138794, "created_at": "2025-06-03T06:54:40.943252+00:00"} {"global_step": 233943, "acc_step": 0, "speed/wps": 5509.7717942173, "speed/FLOPS": 243503711735827.75, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.18 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.18, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04370689392089844, "optim/lr": 1.7941864527926342e-05, "optim/total_tokens": 1962456121344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2838680744171143, "created_at": "2025-06-03T06:54:43.920410+00:00"} {"global_step": 233944, "acc_step": 0, "speed/wps": 5518.854357887972, "speed/FLOPS": 243905114561296.25, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04976972937583923, "optim/lr": 1.793831730283202e-05, "optim/total_tokens": 1962464509952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2924054861068726, "created_at": "2025-06-03T06:54:46.895764+00:00"} {"global_step": 233945, "acc_step": 0, "speed/wps": 5527.016233811693, "speed/FLOPS": 244265827700856.66, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04408205300569534, "optim/lr": 1.7934770077737473e-05, "optim/total_tokens": 1962472898560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.28928804397583, "created_at": "2025-06-03T06:54:49.863820+00:00"} {"global_step": 233946, "acc_step": 0, "speed/wps": 5518.13945010245, "speed/FLOPS": 243873519296405.94, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.17 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.17, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05041375383734703, "optim/lr": 1.7931222852642927e-05, "optim/total_tokens": 1962481287168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.288048267364502, "created_at": "2025-06-03T06:54:52.836695+00:00"} {"global_step": 233947, "acc_step": 0, "speed/wps": 5522.190138493784, "speed/FLOPS": 244052538990000.22, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04542166367173195, "optim/lr": 1.792767562754838e-05, "optim/total_tokens": 1962489675776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2499358654022217, "created_at": "2025-06-03T06:54:55.807180+00:00"} {"global_step": 233948, "acc_step": 0, "speed/wps": 5523.307146513933, "speed/FLOPS": 244101905027125.47, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0448761023581028, "optim/lr": 1.7924128402454054e-05, "optim/total_tokens": 1962498064384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.286662220954895, "created_at": "2025-06-03T06:54:58.777120+00:00"} {"global_step": 233949, "acc_step": 0, "speed/wps": 5520.37940199134, "speed/FLOPS": 243972513704781.8, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04346059635281563, "optim/lr": 1.7920581177359508e-05, "optim/total_tokens": 1962506452992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2853574752807617, "created_at": "2025-06-03T06:55:01.749111+00:00"} {"global_step": 233950, "acc_step": 0, "speed/wps": 5515.580730251747, "speed/FLOPS": 243760436975720.3, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045204099267721176, "optim/lr": 1.791703395226496e-05, "optim/total_tokens": 1962514841600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2721400260925293, "created_at": "2025-06-03T06:55:04.725857+00:00"} {"global_step": 233951, "acc_step": 0, "speed/wps": 5523.352695226008, "speed/FLOPS": 244103918047059.75, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04343793913722038, "optim/lr": 1.7913486727170415e-05, "optim/total_tokens": 1962523230208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2967032194137573, "created_at": "2025-06-03T06:55:07.695594+00:00"} {"global_step": 233952, "acc_step": 0, "speed/wps": 5513.768304962544, "speed/FLOPS": 243680337054771.16, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04414425045251846, "optim/lr": 1.790993950207609e-05, "optim/total_tokens": 1962531618816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2737785577774048, "created_at": "2025-06-03T06:55:10.671796+00:00"} {"global_step": 233953, "acc_step": 0, "speed/wps": 5513.252499840593, "speed/FLOPS": 243657541108510.88, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04334113746881485, "optim/lr": 1.7906392276981542e-05, "optim/total_tokens": 1962540007424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2801514863967896, "created_at": "2025-06-03T06:55:13.650329+00:00"} {"global_step": 233954, "acc_step": 0, "speed/wps": 5524.804027618432, "speed/FLOPS": 244168059510212.28, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04358847066760063, "optim/lr": 1.7902845051886996e-05, "optim/total_tokens": 1962548396032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.291619896888733, "created_at": "2025-06-03T06:55:16.619183+00:00"} {"global_step": 233955, "acc_step": 0, "speed/wps": 5516.3650118675, "speed/FLOPS": 243795098208819.38, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044576846063137054, "optim/lr": 1.789929782679245e-05, "optim/total_tokens": 1962556784640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2829294204711914, "created_at": "2025-06-03T06:55:19.592983+00:00"} {"global_step": 233956, "acc_step": 0, "speed/wps": 5512.297654604155, "speed/FLOPS": 243615341836401.25, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04665946215391159, "optim/lr": 1.7895750601698123e-05, "optim/total_tokens": 1962565173248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2817572355270386, "created_at": "2025-06-03T06:55:22.571303+00:00"} {"global_step": 233957, "acc_step": 0, "speed/wps": 5530.427067742994, "speed/FLOPS": 244416569102389.47, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.44, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.042935267090797424, "optim/lr": 1.7892203376603577e-05, "optim/total_tokens": 1962573561856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2879416942596436, "created_at": "2025-06-03T06:55:25.536965+00:00"} {"global_step": 233958, "acc_step": 0, "speed/wps": 5538.973351600776, "speed/FLOPS": 244794271105057.2, "speed/curr_iter_time": 2.9566, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9566, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044392697513103485, "optim/lr": 1.788865615150903e-05, "optim/total_tokens": 1962581950464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2692209482192993, "created_at": "2025-06-03T06:55:28.498024+00:00"} {"global_step": 233959, "acc_step": 0, "speed/wps": 5517.530776540975, "speed/FLOPS": 243846619040462.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.81, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043440524488687515, "optim/lr": 1.7885108926414484e-05, "optim/total_tokens": 1962590339072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2682569026947021, "created_at": "2025-06-03T06:55:31.470900+00:00"} {"global_step": 233960, "acc_step": 0, "speed/wps": 5515.963275086713, "speed/FLOPS": 243777343499383.88, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.16 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.16, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044700685888528824, "optim/lr": 1.7881561701320158e-05, "optim/total_tokens": 1962598727680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2782235145568848, "created_at": "2025-06-03T06:55:34.444315+00:00"} {"global_step": 233961, "acc_step": 0, "speed/wps": 5528.000641477594, "speed/FLOPS": 244309333481034.28, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04374454915523529, "optim/lr": 1.787801447622561e-05, "optim/total_tokens": 1962607116288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2855108976364136, "created_at": "2025-06-03T06:55:37.414504+00:00"} {"global_step": 233962, "acc_step": 0, "speed/wps": 5530.013557745153, "speed/FLOPS": 244398294077020.94, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.46, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04374072700738907, "optim/lr": 1.7874467251131065e-05, "optim/total_tokens": 1962615504896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2902112007141113, "created_at": "2025-06-03T06:55:40.380421+00:00"} {"global_step": 233963, "acc_step": 0, "speed/wps": 5524.665912229206, "speed/FLOPS": 244161955516947.12, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04480735957622528, "optim/lr": 1.7870920026036742e-05, "optim/total_tokens": 1962623893504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2825626134872437, "created_at": "2025-06-03T06:55:43.352679+00:00"} {"global_step": 233964, "acc_step": 0, "speed/wps": 5518.802567149868, "speed/FLOPS": 243902825675761.1, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04343358799815178, "optim/lr": 1.7867372800942193e-05, "optim/total_tokens": 1962632282112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2743440866470337, "created_at": "2025-06-03T06:55:46.325370+00:00"} {"global_step": 233965, "acc_step": 0, "speed/wps": 5518.970716922193, "speed/FLOPS": 243910257035029.3, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04330134019255638, "optim/lr": 1.7863825575847646e-05, "optim/total_tokens": 1962640670720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.284144401550293, "created_at": "2025-06-03T06:55:49.296956+00:00"} {"global_step": 233966, "acc_step": 0, "speed/wps": 5516.61769443412, "speed/FLOPS": 243806265484917.38, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04315921291708946, "optim/lr": 1.78602783507531e-05, "optim/total_tokens": 1962649059328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.291996717453003, "created_at": "2025-06-03T06:55:52.273150+00:00"} {"global_step": 233967, "acc_step": 0, "speed/wps": 5517.445990633725, "speed/FLOPS": 243842871937335.66, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043852098286151886, "optim/lr": 1.7856731125658777e-05, "optim/total_tokens": 1962657447936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2853230237960815, "created_at": "2025-06-03T06:55:55.246207+00:00"} {"global_step": 233968, "acc_step": 0, "speed/wps": 5526.541012886523, "speed/FLOPS": 244244825368365.34, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04478911682963371, "optim/lr": 1.785318390056423e-05, "optim/total_tokens": 1962665836544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2858904600143433, "created_at": "2025-06-03T06:55:58.217779+00:00"} {"global_step": 233969, "acc_step": 0, "speed/wps": 5524.633508798757, "speed/FLOPS": 244160523451177.1, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0441456139087677, "optim/lr": 1.784963667546968e-05, "optim/total_tokens": 1962674225152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.270775318145752, "created_at": "2025-06-03T06:56:01.186693+00:00"} {"global_step": 233970, "acc_step": 0, "speed/wps": 5519.715409368548, "speed/FLOPS": 243943168629476.72, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045508597046136856, "optim/lr": 1.7846089450375135e-05, "optim/total_tokens": 1962682613760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2627716064453125, "created_at": "2025-06-03T06:56:04.159400+00:00"} {"global_step": 233971, "acc_step": 0, "speed/wps": 5527.627554401377, "speed/FLOPS": 244292844941898.25, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04765079542994499, "optim/lr": 1.7842542225280812e-05, "optim/total_tokens": 1962691002368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.294366717338562, "created_at": "2025-06-03T06:56:07.126920+00:00"} {"global_step": 233972, "acc_step": 0, "speed/wps": 5527.844246544863, "speed/FLOPS": 244302421625509.4, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04407593607902527, "optim/lr": 1.7838995000186265e-05, "optim/total_tokens": 1962699390976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.290324330329895, "created_at": "2025-06-03T06:56:10.097805+00:00"} {"global_step": 233973, "acc_step": 0, "speed/wps": 5525.64924586702, "speed/FLOPS": 244205413830580.7, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04526452347636223, "optim/lr": 1.783544777509172e-05, "optim/total_tokens": 1962707779584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2852120399475098, "created_at": "2025-06-03T06:56:13.066228+00:00"} {"global_step": 233974, "acc_step": 0, "speed/wps": 5524.785191027693, "speed/FLOPS": 244167227029316.03, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.048902761191129684, "optim/lr": 1.7831900549997173e-05, "optim/total_tokens": 1962716168192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2862356901168823, "created_at": "2025-06-03T06:56:16.035136+00:00"} {"global_step": 233975, "acc_step": 0, "speed/wps": 5526.092930942093, "speed/FLOPS": 244225022439912.8, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04351203143596649, "optim/lr": 1.7828353324902846e-05, "optim/total_tokens": 1962724556800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2890688180923462, "created_at": "2025-06-03T06:56:19.007033+00:00"} {"global_step": 233976, "acc_step": 0, "speed/wps": 5511.424977559416, "speed/FLOPS": 243576773977789.84, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.058761876076459885, "optim/lr": 1.78248060998083e-05, "optim/total_tokens": 1962732945408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2869489192962646, "created_at": "2025-06-03T06:56:21.983051+00:00"} {"global_step": 233977, "acc_step": 0, "speed/wps": 5504.60538455078, "speed/FLOPS": 243275382872649.47, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.15 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.15, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0466683954000473, "optim/lr": 1.7821258874713754e-05, "optim/total_tokens": 1962741334016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2766003608703613, "created_at": "2025-06-03T06:56:24.962951+00:00"} {"global_step": 233978, "acc_step": 0, "speed/wps": 5525.100374901969, "speed/FLOPS": 244181156543301.72, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05699910596013069, "optim/lr": 1.7817711649619207e-05, "optim/total_tokens": 1962749722624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2890774011611938, "created_at": "2025-06-03T06:56:27.933665+00:00"} {"global_step": 233979, "acc_step": 0, "speed/wps": 5533.592421944032, "speed/FLOPS": 244556461556323.8, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.29, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04678637534379959, "optim/lr": 1.781416442452488e-05, "optim/total_tokens": 1962758111232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2937848567962646, "created_at": "2025-06-03T06:56:30.898036+00:00"} {"global_step": 233980, "acc_step": 0, "speed/wps": 5532.716943218098, "speed/FLOPS": 244517769877743.88, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.38, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04959326237440109, "optim/lr": 1.7810617199430335e-05, "optim/total_tokens": 1962766499840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2752094268798828, "created_at": "2025-06-03T06:56:33.863031+00:00"} {"global_step": 233981, "acc_step": 0, "speed/wps": 5517.572268438854, "speed/FLOPS": 243848452769973.94, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04338245838880539, "optim/lr": 1.7807069974335788e-05, "optim/total_tokens": 1962774888448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.293238878250122, "created_at": "2025-06-03T06:56:36.838967+00:00"} {"global_step": 233982, "acc_step": 0, "speed/wps": 5512.281982795481, "speed/FLOPS": 243614649222673.47, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.14 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.14, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.049340732395648956, "optim/lr": 1.7803522749241242e-05, "optim/total_tokens": 1962783277056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.282279133796692, "created_at": "2025-06-03T06:56:39.816412+00:00"} {"global_step": 233983, "acc_step": 0, "speed/wps": 5524.805777424774, "speed/FLOPS": 244168136842696.25, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043812643736600876, "optim/lr": 1.7799975524146916e-05, "optim/total_tokens": 1962791665664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2766129970550537, "created_at": "2025-06-03T06:56:42.785297+00:00"} {"global_step": 233984, "acc_step": 0, "speed/wps": 5520.377822152604, "speed/FLOPS": 243972443883996.0, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04736689478158951, "optim/lr": 1.779642829905237e-05, "optim/total_tokens": 1962800054272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.270946741104126, "created_at": "2025-06-03T06:56:45.756749+00:00"} {"global_step": 233985, "acc_step": 0, "speed/wps": 5517.686716924485, "speed/FLOPS": 243853510807238.38, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04344609007239342, "optim/lr": 1.7792881073957823e-05, "optim/total_tokens": 1962808442880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2990286350250244, "created_at": "2025-06-03T06:56:48.732660+00:00"} {"global_step": 233986, "acc_step": 0, "speed/wps": 5518.182871157215, "speed/FLOPS": 243875438284777.47, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045115385204553604, "optim/lr": 1.7789333848863277e-05, "optim/total_tokens": 1962816831488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2809252738952637, "created_at": "2025-06-03T06:56:51.708191+00:00"} {"global_step": 233987, "acc_step": 0, "speed/wps": 5519.105937921972, "speed/FLOPS": 243916233111095.75, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045304931700229645, "optim/lr": 1.778578662376895e-05, "optim/total_tokens": 1962825220096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2890260219573975, "created_at": "2025-06-03T06:56:54.683414+00:00"} {"global_step": 233988, "acc_step": 0, "speed/wps": 5521.389869826173, "speed/FLOPS": 244017171211038.16, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0441334992647171, "optim/lr": 1.7782239398674404e-05, "optim/total_tokens": 1962833608704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2887741327285767, "created_at": "2025-06-03T06:56:57.655165+00:00"} {"global_step": 233989, "acc_step": 0, "speed/wps": 5521.3272729154105, "speed/FLOPS": 244014404747982.5, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04432415962219238, "optim/lr": 1.7778692173579858e-05, "optim/total_tokens": 1962841997312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2847039699554443, "created_at": "2025-06-03T06:57:00.625872+00:00"} {"global_step": 233990, "acc_step": 0, "speed/wps": 5520.700820538739, "speed/FLOPS": 243986718759407.56, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045020442456007004, "optim/lr": 1.7775144948485535e-05, "optim/total_tokens": 1962850385920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2837047576904297, "created_at": "2025-06-03T06:57:03.601790+00:00"} {"global_step": 233991, "acc_step": 0, "speed/wps": 5522.41970393819, "speed/FLOPS": 244062684607620.5, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04338699206709862, "optim/lr": 1.7771597723390985e-05, "optim/total_tokens": 1962858774528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2725006341934204, "created_at": "2025-06-03T06:57:06.572109+00:00"} {"global_step": 233992, "acc_step": 0, "speed/wps": 5527.76073265419, "speed/FLOPS": 244298730739004.5, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.12 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.12, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04334946721792221, "optim/lr": 1.776805049829644e-05, "optim/total_tokens": 1962867163136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2736221551895142, "created_at": "2025-06-03T06:57:09.541427+00:00"} {"global_step": 233993, "acc_step": 0, "speed/wps": 5517.075885741362, "speed/FLOPS": 243826515195461.78, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04485497251152992, "optim/lr": 1.7764503273201892e-05, "optim/total_tokens": 1962875551744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.288511037826538, "created_at": "2025-06-03T06:57:12.514792+00:00"} {"global_step": 233994, "acc_step": 0, "speed/wps": 5512.804852007339, "speed/FLOPS": 243637757365550.34, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.13 hours", "speed/est_time_elapsed_hrs": 193.08, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.13, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0428924635052681, "optim/lr": 1.776095604810757e-05, "optim/total_tokens": 1962883940352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2730567455291748, "created_at": "2025-06-03T06:57:15.491161+00:00"} {"global_step": 233995, "acc_step": 0, "speed/wps": 5532.690777619099, "speed/FLOPS": 244516613492195.8, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.12 hours", "speed/est_time_elapsed_hrs": 192.4, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.12, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04379432648420334, "optim/lr": 1.7757408823013023e-05, "optim/total_tokens": 1962892328960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.273226261138916, "created_at": "2025-06-03T06:57:18.455829+00:00"} {"global_step": 233996, "acc_step": 0, "speed/wps": 5521.134310627083, "speed/FLOPS": 244005876802508.97, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.12 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.12, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04398244619369507, "optim/lr": 1.7753861597918473e-05, "optim/total_tokens": 1962900717568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2859410047531128, "created_at": "2025-06-03T06:57:21.426675+00:00"} {"global_step": 233997, "acc_step": 0, "speed/wps": 5528.811780604009, "speed/FLOPS": 244345181678635.4, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.12 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.12, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.047818731516599655, "optim/lr": 1.7750314372823927e-05, "optim/total_tokens": 1962909106176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.3034462928771973, "created_at": "2025-06-03T06:57:24.393415+00:00"} {"global_step": 233998, "acc_step": 0, "speed/wps": 5525.994777626728, "speed/FLOPS": 244220684565767.9, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.12 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.12, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04334637150168419, "optim/lr": 1.7746767147729604e-05, "optim/total_tokens": 1962917494784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2712376117706299, "created_at": "2025-06-03T06:57:27.365601+00:00"} {"global_step": 233999, "acc_step": 0, "speed/wps": 5521.099761035642, "speed/FLOPS": 244004349887408.1, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.12 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.12, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04739067703485489, "optim/lr": 1.7743219922635058e-05, "optim/total_tokens": 1962925883392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2859195470809937, "created_at": "2025-06-03T06:57:30.342542+00:00"} {"global_step": 234000, "acc_step": 0, "speed/wps": 5517.769028921372, "speed/FLOPS": 243857148576189.8, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.12 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.12, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04357128590345383, "optim/lr": 1.773967269754051e-05, "optim/total_tokens": 1962934272000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2972676753997803, "created_at": "2025-06-03T06:57:33.316299+00:00"} {"global_step": 234001, "acc_step": 0, "speed/wps": 234.4526688265777, "speed/FLOPS": 10361607924589.643, "speed/curr_iter_time": 7.2856, "speed/data_load_time": 2.3847, "speed/curr_step_time": 7.2856, "speed/est_time_elapsed": "19.73 days", "speed/est_time_remaining": "10.12 hours", "speed/est_time_elapsed_hrs": 473.57, "speed/est_time_elapsed_days": 19.73, "speed/est_time_remaining_hrs": 10.12, "speed/est_time_remaining_days": 0.42, "optim/grad_norm": 0.04369959607720375, "optim/lr": 1.773612547244596e-05, "optim/total_tokens": 1962942660608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.28864586353302, "created_at": "2025-06-03T06:58:43.207200+00:00"} {"global_step": 234002, "acc_step": 0, "speed/wps": 5631.438176628087, "speed/FLOPS": 248880743093386.12, "speed/curr_iter_time": 2.9063, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9063, "speed/est_time_elapsed": "7.87 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 188.91, "speed/est_time_elapsed_days": 7.87, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04356478527188301, "optim/lr": 1.773257824735164e-05, "optim/total_tokens": 1962951049216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2825320959091187, "created_at": "2025-06-03T06:58:46.124317+00:00"} {"global_step": 234003, "acc_step": 0, "speed/wps": 5581.6010816862245, "speed/FLOPS": 246678198586332.16, "speed/curr_iter_time": 2.9341, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9341, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 190.72, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04437318816781044, "optim/lr": 1.7729031022257092e-05, "optim/total_tokens": 1962959437824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2926222085952759, "created_at": "2025-06-03T06:58:49.063701+00:00"} {"global_step": 234004, "acc_step": 0, "speed/wps": 5567.576267710682, "speed/FLOPS": 246058373594118.62, "speed/curr_iter_time": 2.9404, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9404, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 191.13, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04434552043676376, "optim/lr": 1.7725483797162546e-05, "optim/total_tokens": 1962967826432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2709535360336304, "created_at": "2025-06-03T06:58:52.015629+00:00"} {"global_step": 234005, "acc_step": 0, "speed/wps": 5534.417203529528, "speed/FLOPS": 244592912680787.88, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.11 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.11, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046335458755493164, "optim/lr": 1.7721936572068e-05, "optim/total_tokens": 1962976215040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.3060117959976196, "created_at": "2025-06-03T06:58:54.983301+00:00"} {"global_step": 234006, "acc_step": 0, "speed/wps": 5561.365722052413, "speed/FLOPS": 245783899264477.5, "speed/curr_iter_time": 2.9447, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9447, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 191.41, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043765898793935776, "optim/lr": 1.7718389346973673e-05, "optim/total_tokens": 1962984603648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2686243057250977, "created_at": "2025-06-03T06:58:57.934628+00:00"} {"global_step": 234007, "acc_step": 0, "speed/wps": 5564.029285508366, "speed/FLOPS": 245901615135876.97, "speed/curr_iter_time": 2.9432, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9432, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 191.31, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04447989538311958, "optim/lr": 1.7714842121879127e-05, "optim/total_tokens": 1962992992256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.275307059288025, "created_at": "2025-06-03T06:59:00.883162+00:00"} {"global_step": 234008, "acc_step": 0, "speed/wps": 5544.696627200674, "speed/FLOPS": 245047210592192.53, "speed/curr_iter_time": 2.9527, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9527, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 191.93, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044163551181554794, "optim/lr": 1.771129489678458e-05, "optim/total_tokens": 1963001380864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2769255638122559, "created_at": "2025-06-03T06:59:03.842965+00:00"} {"global_step": 234009, "acc_step": 0, "speed/wps": 5548.492891824744, "speed/FLOPS": 245214986057532.62, "speed/curr_iter_time": 2.9515, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9515, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 191.85, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04419340938329697, "optim/lr": 1.7707747671690034e-05, "optim/total_tokens": 1963009769472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2828013896942139, "created_at": "2025-06-03T06:59:06.803975+00:00"} {"global_step": 234010, "acc_step": 0, "speed/wps": 5533.756387030419, "speed/FLOPS": 244563707973892.75, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04392235726118088, "optim/lr": 1.7704200446595708e-05, "optim/total_tokens": 1963018158080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2860404253005981, "created_at": "2025-06-03T06:59:09.768540+00:00"} {"global_step": 234011, "acc_step": 0, "speed/wps": 5551.045765534781, "speed/FLOPS": 245327810008724.06, "speed/curr_iter_time": 2.9493, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9493, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 191.71, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04429931938648224, "optim/lr": 1.770065322150116e-05, "optim/total_tokens": 1963026546688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2906450033187866, "created_at": "2025-06-03T06:59:12.726608+00:00"} {"global_step": 234012, "acc_step": 0, "speed/wps": 5519.849539797915, "speed/FLOPS": 243949096507912.97, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.11 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.11, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045587338507175446, "optim/lr": 1.7697105996406615e-05, "optim/total_tokens": 1963034935296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2793219089508057, "created_at": "2025-06-03T06:59:15.698411+00:00"} {"global_step": 234013, "acc_step": 0, "speed/wps": 5534.4278760643365, "speed/FLOPS": 244593384352199.44, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04367213696241379, "optim/lr": 1.769355877131207e-05, "optim/total_tokens": 1963043323904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2876794338226318, "created_at": "2025-06-03T06:59:18.668249+00:00"} {"global_step": 234014, "acc_step": 0, "speed/wps": 5520.2616960878695, "speed/FLOPS": 243967311706321.8, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.11 hours", "speed/est_time_elapsed_hrs": 192.78, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.11, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044083546847105026, "optim/lr": 1.7690011546217743e-05, "optim/total_tokens": 1963051712512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.292718529701233, "created_at": "2025-06-03T06:59:21.643035+00:00"} {"global_step": 234015, "acc_step": 0, "speed/wps": 5549.734636332354, "speed/FLOPS": 245269864808944.44, "speed/curr_iter_time": 2.9509, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9509, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 191.82, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04437137395143509, "optim/lr": 1.7686464321123196e-05, "optim/total_tokens": 1963060101120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2773096561431885, "created_at": "2025-06-03T06:59:24.604512+00:00"} {"global_step": 234016, "acc_step": 0, "speed/wps": 5535.517433754448, "speed/FLOPS": 244641537225240.53, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.32, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045217208564281464, "optim/lr": 1.768291709602865e-05, "optim/total_tokens": 1963068489728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2738592624664307, "created_at": "2025-06-03T06:59:27.568599+00:00"} {"global_step": 234017, "acc_step": 0, "speed/wps": 5527.02694554331, "speed/FLOPS": 244266301104566.5, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0461910143494606, "optim/lr": 1.7679369870934324e-05, "optim/total_tokens": 1963076878336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2836101055145264, "created_at": "2025-06-03T06:59:30.536337+00:00"} {"global_step": 234018, "acc_step": 0, "speed/wps": 5539.606254426235, "speed/FLOPS": 244822242170452.12, "speed/curr_iter_time": 2.9553, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9553, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.11, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04390284791588783, "optim/lr": 1.7675822645839777e-05, "optim/total_tokens": 1963085266944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2892506122589111, "created_at": "2025-06-03T06:59:33.500759+00:00"} {"global_step": 234019, "acc_step": 0, "speed/wps": 5529.118921602747, "speed/FLOPS": 244358755738689.47, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.048294808715581894, "optim/lr": 1.767227542074523e-05, "optim/total_tokens": 1963093655552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2752069234848022, "created_at": "2025-06-03T06:59:36.468519+00:00"} {"global_step": 234020, "acc_step": 0, "speed/wps": 5526.928965676615, "speed/FLOPS": 244261970895965.0, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04740999639034271, "optim/lr": 1.7668728195650685e-05, "optim/total_tokens": 1963102044160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.286380410194397, "created_at": "2025-06-03T06:59:39.436080+00:00"} {"global_step": 234021, "acc_step": 0, "speed/wps": 5513.026060648556, "speed/FLOPS": 243647533655243.7, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.11 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.11, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04997798800468445, "optim/lr": 1.7665180970556362e-05, "optim/total_tokens": 1963110432768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2840814590454102, "created_at": "2025-06-03T06:59:42.414485+00:00"} {"global_step": 234022, "acc_step": 0, "speed/wps": 5519.225323067549, "speed/FLOPS": 243921509323461.66, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043963994830846786, "optim/lr": 1.7661633745461812e-05, "optim/total_tokens": 1963118821376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2773879766464233, "created_at": "2025-06-03T06:59:45.393076+00:00"} {"global_step": 234023, "acc_step": 0, "speed/wps": 5539.260179146412, "speed/FLOPS": 244806947414457.8, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.18, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04519985243678093, "optim/lr": 1.7658086520367266e-05, "optim/total_tokens": 1963127209984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2758773565292358, "created_at": "2025-06-03T06:59:48.354827+00:00"} {"global_step": 234024, "acc_step": 0, "speed/wps": 5533.728128454293, "speed/FLOPS": 244562459089468.47, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.23, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04381990060210228, "optim/lr": 1.765453929527272e-05, "optim/total_tokens": 1963135598592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2683320045471191, "created_at": "2025-06-03T06:59:51.323373+00:00"} {"global_step": 234025, "acc_step": 0, "speed/wps": 5548.366100746484, "speed/FLOPS": 245209382540849.12, "speed/curr_iter_time": 2.9515, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9515, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 191.87, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046037159860134125, "optim/lr": 1.7650992070178396e-05, "optim/total_tokens": 1963143987200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2825084924697876, "created_at": "2025-06-03T06:59:54.280316+00:00"} {"global_step": 234026, "acc_step": 0, "speed/wps": 5540.902825653381, "speed/FLOPS": 244879543982238.84, "speed/curr_iter_time": 2.9556, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9556, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0448019839823246, "optim/lr": 1.764744484508385e-05, "optim/total_tokens": 1963152375808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.264802098274231, "created_at": "2025-06-03T06:59:57.240611+00:00"} {"global_step": 234027, "acc_step": 0, "speed/wps": 5546.0882774799975, "speed/FLOPS": 245108714411426.78, "speed/curr_iter_time": 2.9529, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9529, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 191.96, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043799988925457, "optim/lr": 1.7643897619989304e-05, "optim/total_tokens": 1963160764416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2736109495162964, "created_at": "2025-06-03T07:00:00.202195+00:00"} {"global_step": 234028, "acc_step": 0, "speed/wps": 5527.128320301531, "speed/FLOPS": 244270781349996.8, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.53, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04631488025188446, "optim/lr": 1.7640350394894754e-05, "optim/total_tokens": 1963169153024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2838873863220215, "created_at": "2025-06-03T07:00:03.171880+00:00"} {"global_step": 234029, "acc_step": 0, "speed/wps": 5518.287200191881, "speed/FLOPS": 243880049094105.3, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04508870840072632, "optim/lr": 1.763680316980043e-05, "optim/total_tokens": 1963177541632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2859737873077393, "created_at": "2025-06-03T07:00:06.148738+00:00"} {"global_step": 234030, "acc_step": 0, "speed/wps": 5539.474078133339, "speed/FLOPS": 244816400654845.75, "speed/curr_iter_time": 2.9566, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9566, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.2, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04420757293701172, "optim/lr": 1.7633255944705885e-05, "optim/total_tokens": 1963185930240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2719275951385498, "created_at": "2025-06-03T07:00:09.114379+00:00"} {"global_step": 234031, "acc_step": 0, "speed/wps": 5525.929270828807, "speed/FLOPS": 244217789500593.97, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04368237033486366, "optim/lr": 1.762970871961134e-05, "optim/total_tokens": 1963194318848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2856029272079468, "created_at": "2025-06-03T07:00:12.087664+00:00"} {"global_step": 234032, "acc_step": 0, "speed/wps": 5526.951687771076, "speed/FLOPS": 244262975096237.94, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04518342763185501, "optim/lr": 1.7626161494516792e-05, "optim/total_tokens": 1963202707456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2845029830932617, "created_at": "2025-06-03T07:00:15.058473+00:00"} {"global_step": 234033, "acc_step": 0, "speed/wps": 5535.0003148721, "speed/FLOPS": 244618683217495.16, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04427538067102432, "optim/lr": 1.7622614269422466e-05, "optim/total_tokens": 1963211096064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2928870916366577, "created_at": "2025-06-03T07:00:18.022321+00:00"} {"global_step": 234034, "acc_step": 0, "speed/wps": 5534.911874093041, "speed/FLOPS": 244614774587741.7, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04535597562789917, "optim/lr": 1.761906704432792e-05, "optim/total_tokens": 1963219484672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2635669708251953, "created_at": "2025-06-03T07:00:20.985905+00:00"} {"global_step": 234035, "acc_step": 0, "speed/wps": 5532.715534663008, "speed/FLOPS": 244517707626818.53, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.35, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0441073477268219, "optim/lr": 1.7615519819233373e-05, "optim/total_tokens": 1963227873280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2783688306808472, "created_at": "2025-06-03T07:00:23.954432+00:00"} {"global_step": 234036, "acc_step": 0, "speed/wps": 5527.0031358188235, "speed/FLOPS": 244265248836613.4, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044172581285238266, "optim/lr": 1.7611972594138827e-05, "optim/total_tokens": 1963236261888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2926599979400635, "created_at": "2025-06-03T07:00:26.927016+00:00"} {"global_step": 234037, "acc_step": 0, "speed/wps": 5513.21736375444, "speed/FLOPS": 243655988273345.7, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.1 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.1, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04383937641978264, "optim/lr": 1.76084253690445e-05, "optim/total_tokens": 1963244650496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2849236726760864, "created_at": "2025-06-03T07:00:29.905942+00:00"} {"global_step": 234038, "acc_step": 0, "speed/wps": 5518.6288211870315, "speed/FLOPS": 243895146993516.2, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043316252529621124, "optim/lr": 1.7604878143949954e-05, "optim/total_tokens": 1963253039104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2833696603775024, "created_at": "2025-06-03T07:00:32.882448+00:00"} {"global_step": 234039, "acc_step": 0, "speed/wps": 5526.800879729122, "speed/FLOPS": 244256310152689.16, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04646419361233711, "optim/lr": 1.7601330918855408e-05, "optim/total_tokens": 1963261427712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.286622166633606, "created_at": "2025-06-03T07:00:35.856629+00:00"} {"global_step": 234040, "acc_step": 0, "speed/wps": 5531.880516512545, "speed/FLOPS": 244480804098578.4, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045154016464948654, "optim/lr": 1.759778369376086e-05, "optim/total_tokens": 1963269816320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.270113229751587, "created_at": "2025-06-03T07:00:38.822791+00:00"} {"global_step": 234041, "acc_step": 0, "speed/wps": 5528.832382250246, "speed/FLOPS": 244346092165950.3, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043837424367666245, "optim/lr": 1.7594236468666535e-05, "optim/total_tokens": 1963278204928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2770344018936157, "created_at": "2025-06-03T07:00:41.793815+00:00"} {"global_step": 234042, "acc_step": 0, "speed/wps": 5521.0229119785345, "speed/FLOPS": 244000953552433.1, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04380515217781067, "optim/lr": 1.759068924357199e-05, "optim/total_tokens": 1963286593536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2665021419525146, "created_at": "2025-06-03T07:00:44.769872+00:00"} {"global_step": 234043, "acc_step": 0, "speed/wps": 5525.093430898276, "speed/FLOPS": 244180849653881.1, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045305609703063965, "optim/lr": 1.7587142018477442e-05, "optim/total_tokens": 1963294982144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2759491205215454, "created_at": "2025-06-03T07:00:47.742994+00:00"} {"global_step": 234044, "acc_step": 0, "speed/wps": 5522.994333726824, "speed/FLOPS": 244088080303056.25, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04441872984170914, "optim/lr": 1.7583594793383116e-05, "optim/total_tokens": 1963303370752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2694801092147827, "created_at": "2025-06-03T07:00:50.715870+00:00"} {"global_step": 234045, "acc_step": 0, "speed/wps": 5522.362246972356, "speed/FLOPS": 244060145303822.03, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046087317168712616, "optim/lr": 1.758004756828857e-05, "optim/total_tokens": 1963311759360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2863953113555908, "created_at": "2025-06-03T07:00:53.690572+00:00"} {"global_step": 234046, "acc_step": 0, "speed/wps": 5510.451479475548, "speed/FLOPS": 243533750345297.78, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0488116629421711, "optim/lr": 1.7576500343194023e-05, "optim/total_tokens": 1963320147968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2928996086120605, "created_at": "2025-06-03T07:00:56.670357+00:00"} {"global_step": 234047, "acc_step": 0, "speed/wps": 5510.565479980021, "speed/FLOPS": 243538788584088.03, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.09 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.09, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04420190677046776, "optim/lr": 1.7572953118099477e-05, "optim/total_tokens": 1963328536576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2703402042388916, "created_at": "2025-06-03T07:00:59.649911+00:00"} {"global_step": 234048, "acc_step": 0, "speed/wps": 5533.215406642573, "speed/FLOPS": 244539799409738.56, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.36, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.043939024209976196, "optim/lr": 1.7569405893005154e-05, "optim/total_tokens": 1963336925184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.29221510887146, "created_at": "2025-06-03T07:01:02.614727+00:00"} {"global_step": 234049, "acc_step": 0, "speed/wps": 5529.940223294985, "speed/FLOPS": 244395053069683.25, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.050514061003923416, "optim/lr": 1.7565858667910604e-05, "optim/total_tokens": 1963345313792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2867170572280884, "created_at": "2025-06-03T07:01:05.581147+00:00"} {"global_step": 234050, "acc_step": 0, "speed/wps": 5529.910606548201, "speed/FLOPS": 244393744161067.66, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04519190266728401, "optim/lr": 1.7562311442816058e-05, "optim/total_tokens": 1963353702400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2956645488739014, "created_at": "2025-06-03T07:01:08.548138+00:00"} {"global_step": 234051, "acc_step": 0, "speed/wps": 5533.195038154949, "speed/FLOPS": 244538899226840.97, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04792209714651108, "optim/lr": 1.755876421772151e-05, "optim/total_tokens": 1963362091008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2829359769821167, "created_at": "2025-06-03T07:01:11.516918+00:00"} {"global_step": 234052, "acc_step": 0, "speed/wps": 5523.705619589709, "speed/FLOPS": 244119515497504.7, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04869462922215462, "optim/lr": 1.755521699262719e-05, "optim/total_tokens": 1963370479616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2724543809890747, "created_at": "2025-06-03T07:01:14.490805+00:00"} {"global_step": 234053, "acc_step": 0, "speed/wps": 5519.774029228024, "speed/FLOPS": 243945759327221.94, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0453285351395607, "optim/lr": 1.7551669767532642e-05, "optim/total_tokens": 1963378868224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.278161883354187, "created_at": "2025-06-03T07:01:17.462833+00:00"} {"global_step": 234054, "acc_step": 0, "speed/wps": 5511.861100642926, "speed/FLOPS": 243596048385800.72, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04572378844022751, "optim/lr": 1.7548122542438093e-05, "optim/total_tokens": 1963387256832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.292357087135315, "created_at": "2025-06-03T07:01:20.439701+00:00"} {"global_step": 234055, "acc_step": 0, "speed/wps": 5507.244354684869, "speed/FLOPS": 243392011845102.56, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04503874108195305, "optim/lr": 1.7544575317343546e-05, "optim/total_tokens": 1963395645440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2883899211883545, "created_at": "2025-06-03T07:01:23.421406+00:00"} {"global_step": 234056, "acc_step": 0, "speed/wps": 5509.402728913447, "speed/FLOPS": 243487400938444.94, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04543893039226532, "optim/lr": 1.7541028092249223e-05, "optim/total_tokens": 1963404034048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2725780010223389, "created_at": "2025-06-03T07:01:26.399040+00:00"} {"global_step": 234057, "acc_step": 0, "speed/wps": 5530.897552345181, "speed/FLOPS": 244437362113647.62, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05060332268476486, "optim/lr": 1.7537480867154677e-05, "optim/total_tokens": 1963412422656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2821719646453857, "created_at": "2025-06-03T07:01:29.370487+00:00"} {"global_step": 234058, "acc_step": 0, "speed/wps": 5524.8103284880035, "speed/FLOPS": 244168337976396.56, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04337436705827713, "optim/lr": 1.753393364206013e-05, "optim/total_tokens": 1963420811264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2750029563903809, "created_at": "2025-06-03T07:01:32.343855+00:00"} {"global_step": 234059, "acc_step": 0, "speed/wps": 5530.111995991362, "speed/FLOPS": 244402644543650.75, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04715992510318756, "optim/lr": 1.753038641696558e-05, "optim/total_tokens": 1963429199872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2733458280563354, "created_at": "2025-06-03T07:01:35.310497+00:00"} {"global_step": 234060, "acc_step": 0, "speed/wps": 5521.768113321852, "speed/FLOPS": 244033887637521.47, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04543134570121765, "optim/lr": 1.7526839191871258e-05, "optim/total_tokens": 1963437588480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2905597686767578, "created_at": "2025-06-03T07:01:38.281640+00:00"} {"global_step": 234061, "acc_step": 0, "speed/wps": 5524.921451885512, "speed/FLOPS": 244173249061785.34, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04489424079656601, "optim/lr": 1.7523291966776712e-05, "optim/total_tokens": 1963445977088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2837814092636108, "created_at": "2025-06-03T07:01:41.250801+00:00"} {"global_step": 234062, "acc_step": 0, "speed/wps": 5526.692237335283, "speed/FLOPS": 244251508714963.62, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04392595216631889, "optim/lr": 1.7519744741682165e-05, "optim/total_tokens": 1963454365696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2856236696243286, "created_at": "2025-06-03T07:01:44.223796+00:00"} {"global_step": 234063, "acc_step": 0, "speed/wps": 5518.981372818478, "speed/FLOPS": 243910727971103.28, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044191766530275345, "optim/lr": 1.751619751658762e-05, "optim/total_tokens": 1963462754304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2980575561523438, "created_at": "2025-06-03T07:01:47.200962+00:00"} {"global_step": 234064, "acc_step": 0, "speed/wps": 5508.563327445305, "speed/FLOPS": 243450303689999.22, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.08 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.08, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04891369491815567, "optim/lr": 1.7512650291493293e-05, "optim/total_tokens": 1963471142912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2888121604919434, "created_at": "2025-06-03T07:01:50.179287+00:00"} {"global_step": 234065, "acc_step": 0, "speed/wps": 5531.260388012085, "speed/FLOPS": 244453397592963.5, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 192.41, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04538438096642494, "optim/lr": 1.7509103066398746e-05, "optim/total_tokens": 1963479531520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2798186540603638, "created_at": "2025-06-03T07:01:53.145445+00:00"} {"global_step": 234066, "acc_step": 0, "speed/wps": 5533.708597363226, "speed/FLOPS": 244561595915212.47, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0455956868827343, "optim/lr": 1.75055558413042e-05, "optim/total_tokens": 1963487920128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2781412601470947, "created_at": "2025-06-03T07:01:56.109946+00:00"} {"global_step": 234067, "acc_step": 0, "speed/wps": 5519.772312915752, "speed/FLOPS": 243945683475004.38, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04425263777375221, "optim/lr": 1.7502008616209654e-05, "optim/total_tokens": 1963496308736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.288420557975769, "created_at": "2025-06-03T07:01:59.082382+00:00"} {"global_step": 234068, "acc_step": 0, "speed/wps": 5522.079270106262, "speed/FLOPS": 244047639174747.6, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04450167343020439, "optim/lr": 1.7498461391115327e-05, "optim/total_tokens": 1963504697344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2894861698150635, "created_at": "2025-06-03T07:02:02.053752+00:00"} {"global_step": 234069, "acc_step": 0, "speed/wps": 5521.928776371487, "speed/FLOPS": 244040988121967.3, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04324634000658989, "optim/lr": 1.749491416602078e-05, "optim/total_tokens": 1963513085952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2665092945098877, "created_at": "2025-06-03T07:02:05.028108+00:00"} {"global_step": 234070, "acc_step": 0, "speed/wps": 5526.255240183464, "speed/FLOPS": 244232195677607.4, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04853913187980652, "optim/lr": 1.7491366940926235e-05, "optim/total_tokens": 1963521474560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2716326713562012, "created_at": "2025-06-03T07:02:07.996233+00:00"} {"global_step": 234071, "acc_step": 0, "speed/wps": 5513.35858854563, "speed/FLOPS": 243662229686262.25, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04389045014977455, "optim/lr": 1.7487819715831688e-05, "optim/total_tokens": 1963529863168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2951083183288574, "created_at": "2025-06-03T07:02:10.975969+00:00"} {"global_step": 234072, "acc_step": 0, "speed/wps": 5508.071399062572, "speed/FLOPS": 243428562973400.16, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05054410174489021, "optim/lr": 1.7484272490737362e-05, "optim/total_tokens": 1963538251776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2856523990631104, "created_at": "2025-06-03T07:02:13.957563+00:00"} {"global_step": 234073, "acc_step": 0, "speed/wps": 5517.83772068592, "speed/FLOPS": 243860184400586.5, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04469606280326843, "optim/lr": 1.7480725265642816e-05, "optim/total_tokens": 1963546640384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2756695747375488, "created_at": "2025-06-03T07:02:16.934406+00:00"} {"global_step": 234074, "acc_step": 0, "speed/wps": 5530.763373062849, "speed/FLOPS": 244431432076160.38, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.56, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04708646237850189, "optim/lr": 1.747717804054827e-05, "optim/total_tokens": 1963555028992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.288391351699829, "created_at": "2025-06-03T07:02:19.903553+00:00"} {"global_step": 234075, "acc_step": 0, "speed/wps": 5519.37110658365, "speed/FLOPS": 243927952208685.62, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04370548576116562, "optim/lr": 1.7473630815453943e-05, "optim/total_tokens": 1963563417600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2780897617340088, "created_at": "2025-06-03T07:02:22.877748+00:00"} {"global_step": 234076, "acc_step": 0, "speed/wps": 5526.155334345638, "speed/FLOPS": 244227780350939.94, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04917396605014801, "optim/lr": 1.7470083590359397e-05, "optim/total_tokens": 1963571806208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2759965658187866, "created_at": "2025-06-03T07:02:25.850666+00:00"} {"global_step": 234077, "acc_step": 0, "speed/wps": 5524.032110674122, "speed/FLOPS": 244133944732302.88, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04495660960674286, "optim/lr": 1.746653636526485e-05, "optim/total_tokens": 1963580194816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2737609148025513, "created_at": "2025-06-03T07:02:28.824108+00:00"} {"global_step": 234078, "acc_step": 0, "speed/wps": 5508.541658394251, "speed/FLOPS": 243449346028854.88, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05540887266397476, "optim/lr": 1.7462989140170304e-05, "optim/total_tokens": 1963588583424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.294968605041504, "created_at": "2025-06-03T07:02:31.806670+00:00"} {"global_step": 234079, "acc_step": 0, "speed/wps": 5509.66037563013, "speed/FLOPS": 243498787604566.88, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0461493656039238, "optim/lr": 1.745944191507598e-05, "optim/total_tokens": 1963596972032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2767969369888306, "created_at": "2025-06-03T07:02:34.788781+00:00"} {"global_step": 234080, "acc_step": 0, "speed/wps": 5514.376308525039, "speed/FLOPS": 243707207700189.1, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.056568894535303116, "optim/lr": 1.745589468998143e-05, "optim/total_tokens": 1963605360640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.282222867012024, "created_at": "2025-06-03T07:02:37.769110+00:00"} {"global_step": 234081, "acc_step": 0, "speed/wps": 5503.558886266293, "speed/FLOPS": 243229133004938.9, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.07 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.07, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04353072866797447, "optim/lr": 1.7452347464886885e-05, "optim/total_tokens": 1963613749248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2843661308288574, "created_at": "2025-06-03T07:02:40.750776+00:00"} {"global_step": 234082, "acc_step": 0, "speed/wps": 5526.139228216685, "speed/FLOPS": 244227068542478.88, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05395020171999931, "optim/lr": 1.744880023979234e-05, "optim/total_tokens": 1963622137856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2834163904190063, "created_at": "2025-06-03T07:02:43.722430+00:00"} {"global_step": 234083, "acc_step": 0, "speed/wps": 5527.340033830333, "speed/FLOPS": 244280138004321.78, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04670664668083191, "optim/lr": 1.7445253014698016e-05, "optim/total_tokens": 1963630526464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2994558811187744, "created_at": "2025-06-03T07:02:46.695190+00:00"} {"global_step": 234084, "acc_step": 0, "speed/wps": 5530.974693067106, "speed/FLOPS": 244440771338714.72, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 192.55, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05244045704603195, "optim/lr": 1.744170578960347e-05, "optim/total_tokens": 1963638915072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2866727113723755, "created_at": "2025-06-03T07:02:49.661923+00:00"} {"global_step": 234085, "acc_step": 0, "speed/wps": 5504.722465930321, "speed/FLOPS": 243280557270348.34, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.050242844969034195, "optim/lr": 1.7438158564508923e-05, "optim/total_tokens": 1963647303680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2681403160095215, "created_at": "2025-06-03T07:02:52.643271+00:00"} {"global_step": 234086, "acc_step": 0, "speed/wps": 5524.3725038704615, "speed/FLOPS": 244148988369290.75, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04725874215364456, "optim/lr": 1.7434611339414373e-05, "optim/total_tokens": 1963655692288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2761672735214233, "created_at": "2025-06-03T07:02:55.616636+00:00"} {"global_step": 234087, "acc_step": 0, "speed/wps": 5517.347311501381, "speed/FLOPS": 243838510824771.62, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.048858948051929474, "optim/lr": 1.743106411432005e-05, "optim/total_tokens": 1963664080896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2656025886535645, "created_at": "2025-06-03T07:02:58.595171+00:00"} {"global_step": 234088, "acc_step": 0, "speed/wps": 5518.463736778558, "speed/FLOPS": 243887851107640.25, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04441942647099495, "optim/lr": 1.7427516889225504e-05, "optim/total_tokens": 1963672469504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2816765308380127, "created_at": "2025-06-03T07:03:01.569743+00:00"} {"global_step": 234089, "acc_step": 0, "speed/wps": 5506.310435233482, "speed/FLOPS": 243350737385584.34, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.06 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.06, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05413580313324928, "optim/lr": 1.7423969664130958e-05, "optim/total_tokens": 1963680858112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2804228067398071, "created_at": "2025-06-03T07:03:04.550525+00:00"} {"global_step": 234090, "acc_step": 0, "speed/wps": 5519.015675145715, "speed/FLOPS": 243912243958391.94, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04934287443757057, "optim/lr": 1.742042243903641e-05, "optim/total_tokens": 1963689246720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2731108665466309, "created_at": "2025-06-03T07:03:07.528008+00:00"} {"global_step": 234091, "acc_step": 0, "speed/wps": 5525.006527129228, "speed/FLOPS": 244177008952103.0, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04924272745847702, "optim/lr": 1.7416875213942085e-05, "optim/total_tokens": 1963697635328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2783595323562622, "created_at": "2025-06-03T07:03:10.500064+00:00"} {"global_step": 234092, "acc_step": 0, "speed/wps": 5514.017992634679, "speed/FLOPS": 243691371971862.16, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.05 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.05, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05860232934355736, "optim/lr": 1.741332798884754e-05, "optim/total_tokens": 1963706023936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2812881469726562, "created_at": "2025-06-03T07:03:13.477773+00:00"} {"global_step": 234093, "acc_step": 0, "speed/wps": 5520.356115918186, "speed/FLOPS": 243971484579537.34, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04424314945936203, "optim/lr": 1.7409780763752992e-05, "optim/total_tokens": 1963714412544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2801475524902344, "created_at": "2025-06-03T07:03:16.449469+00:00"} {"global_step": 234094, "acc_step": 0, "speed/wps": 5526.439802897971, "speed/FLOPS": 244240352404911.03, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05793480947613716, "optim/lr": 1.7406233538658446e-05, "optim/total_tokens": 1963722801152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2660216093063354, "created_at": "2025-06-03T07:03:19.418394+00:00"} {"global_step": 234095, "acc_step": 0, "speed/wps": 5522.4196835688535, "speed/FLOPS": 244062683707400.1, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04361194372177124, "optim/lr": 1.740268631356412e-05, "optim/total_tokens": 1963731189760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.287755012512207, "created_at": "2025-06-03T07:03:22.392307+00:00"} {"global_step": 234096, "acc_step": 0, "speed/wps": 5430.949936018564, "speed/FLOPS": 240020189050287.2, "speed/curr_iter_time": 3.0158, "speed/data_load_time": 0.0007, "speed/curr_step_time": 3.0158, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "4.11 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 4.11, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05192474648356438, "optim/lr": 1.7399139088469573e-05, "optim/total_tokens": 1963739578368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2817926406860352, "created_at": "2025-06-03T07:03:25.418494+00:00"} {"global_step": 234097, "acc_step": 0, "speed/wps": 5514.7717228673155, "speed/FLOPS": 243724682990203.62, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05580970644950867, "optim/lr": 1.7395591863375027e-05, "optim/total_tokens": 1963747966976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2787401676177979, "created_at": "2025-06-03T07:03:28.392568+00:00"} {"global_step": 234098, "acc_step": 0, "speed/wps": 5515.855310847128, "speed/FLOPS": 243772572032605.28, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05106792598962784, "optim/lr": 1.739204463828048e-05, "optim/total_tokens": 1963756355584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2710111141204834, "created_at": "2025-06-03T07:03:31.369430+00:00"} {"global_step": 234099, "acc_step": 0, "speed/wps": 5524.709271664682, "speed/FLOPS": 244163871782061.47, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05714989826083183, "optim/lr": 1.7388497413186154e-05, "optim/total_tokens": 1963764744192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2760287523269653, "created_at": "2025-06-03T07:03:34.342752+00:00"} {"global_step": 234100, "acc_step": 0, "speed/wps": 5527.025746521886, "speed/FLOPS": 244266248113956.7, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05008689686655998, "optim/lr": 1.7384950188091608e-05, "optim/total_tokens": 1963773132800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2793924808502197, "created_at": "2025-06-03T07:03:37.310667+00:00"} {"global_step": 234101, "acc_step": 0, "speed/wps": 5515.62732667675, "speed/FLOPS": 243762496299203.34, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05030239000916481, "optim/lr": 1.738140296299706e-05, "optim/total_tokens": 1963781521408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2752423286437988, "created_at": "2025-06-03T07:03:40.289997+00:00"} {"global_step": 234102, "acc_step": 0, "speed/wps": 5509.471071472511, "speed/FLOPS": 243490421329746.6, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.049728598445653915, "optim/lr": 1.7377855737902735e-05, "optim/total_tokens": 1963789910016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2669625282287598, "created_at": "2025-06-03T07:03:43.270401+00:00"} {"global_step": 234103, "acc_step": 0, "speed/wps": 5512.273656400733, "speed/FLOPS": 243614281238643.94, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.047565653920173645, "optim/lr": 1.737430851280819e-05, "optim/total_tokens": 1963798298624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2767996788024902, "created_at": "2025-06-03T07:03:46.251767+00:00"} {"global_step": 234104, "acc_step": 0, "speed/wps": 5514.946267685995, "speed/FLOPS": 243732396977787.88, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04995949938893318, "optim/lr": 1.7370761287713643e-05, "optim/total_tokens": 1963806687232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.270492434501648, "created_at": "2025-06-03T07:03:49.227471+00:00"} {"global_step": 234105, "acc_step": 0, "speed/wps": 5516.603014806325, "speed/FLOPS": 243805616720505.97, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.052863284945487976, "optim/lr": 1.7367214062619096e-05, "optim/total_tokens": 1963815075840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2549726963043213, "created_at": "2025-06-03T07:03:52.201169+00:00"} {"global_step": 234106, "acc_step": 0, "speed/wps": 5510.207752345006, "speed/FLOPS": 243522978853636.38, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04551136493682861, "optim/lr": 1.7363666837524774e-05, "optim/total_tokens": 1963823464448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2634862661361694, "created_at": "2025-06-03T07:03:55.178616+00:00"} {"global_step": 234107, "acc_step": 0, "speed/wps": 5530.194562214774, "speed/FLOPS": 244406293548113.3, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 192.51, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05587143450975418, "optim/lr": 1.7360119612430224e-05, "optim/total_tokens": 1963831853056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2579371929168701, "created_at": "2025-06-03T07:03:58.144921+00:00"} {"global_step": 234108, "acc_step": 0, "speed/wps": 5525.839726352273, "speed/FLOPS": 244213832093061.34, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046092256903648376, "optim/lr": 1.7356572387335677e-05, "optim/total_tokens": 1963840241664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2651139497756958, "created_at": "2025-06-03T07:04:01.115551+00:00"} {"global_step": 234109, "acc_step": 0, "speed/wps": 5512.604350153379, "speed/FLOPS": 243628896209866.84, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04736322909593582, "optim/lr": 1.735302516224113e-05, "optim/total_tokens": 1963848630272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2740166187286377, "created_at": "2025-06-03T07:04:04.094423+00:00"} {"global_step": 234110, "acc_step": 0, "speed/wps": 5523.409198627065, "speed/FLOPS": 244106415208175.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0536479614675045, "optim/lr": 1.7349477937146808e-05, "optim/total_tokens": 1963857018880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2690788507461548, "created_at": "2025-06-03T07:04:07.063566+00:00"} {"global_step": 234111, "acc_step": 0, "speed/wps": 5517.750820032247, "speed/FLOPS": 243856343836492.03, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04431020841002464, "optim/lr": 1.7345930712052262e-05, "optim/total_tokens": 1963865407488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2601544857025146, "created_at": "2025-06-03T07:04:10.036788+00:00"} {"global_step": 234112, "acc_step": 0, "speed/wps": 5497.237916181948, "speed/FLOPS": 242949778480868.7, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "4.04 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 4.04, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05559016391634941, "optim/lr": 1.7342383486957712e-05, "optim/total_tokens": 1963873796096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2496377229690552, "created_at": "2025-06-03T07:04:13.025578+00:00"} {"global_step": 234113, "acc_step": 0, "speed/wps": 5512.228942670561, "speed/FLOPS": 243612305120635.97, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046576689928770065, "optim/lr": 1.7338836261863166e-05, "optim/total_tokens": 1963882184704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2695034742355347, "created_at": "2025-06-03T07:04:16.004952+00:00"} {"global_step": 234114, "acc_step": 0, "speed/wps": 5515.180552286077, "speed/FLOPS": 243742751157934.22, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.06057807430624962, "optim/lr": 1.7335289036768843e-05, "optim/total_tokens": 1963890573312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2639135122299194, "created_at": "2025-06-03T07:04:18.980248+00:00"} {"global_step": 234115, "acc_step": 0, "speed/wps": 5517.73318539625, "speed/FLOPS": 243855564475843.2, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04776083305478096, "optim/lr": 1.7331741811674296e-05, "optim/total_tokens": 1963898961920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2809909582138062, "created_at": "2025-06-03T07:04:21.957419+00:00"} {"global_step": 234116, "acc_step": 0, "speed/wps": 5523.289951055997, "speed/FLOPS": 244101145075899.03, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.061257146298885345, "optim/lr": 1.732819458657975e-05, "optim/total_tokens": 1963907350528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2643383741378784, "created_at": "2025-06-03T07:04:24.930836+00:00"} {"global_step": 234117, "acc_step": 0, "speed/wps": 5517.04776266492, "speed/FLOPS": 243825272299429.97, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.047015558928251266, "optim/lr": 1.73246473614852e-05, "optim/total_tokens": 1963915739136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.269608497619629, "created_at": "2025-06-03T07:04:27.908360+00:00"} {"global_step": 234118, "acc_step": 0, "speed/wps": 5514.652656937974, "speed/FLOPS": 243719420885561.4, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.050595227628946304, "optim/lr": 1.7321100136390877e-05, "optim/total_tokens": 1963924127744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2707993984222412, "created_at": "2025-06-03T07:04:30.886997+00:00"} {"global_step": 234119, "acc_step": 0, "speed/wps": 5517.090320897502, "speed/FLOPS": 243827153155477.34, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04668634757399559, "optim/lr": 1.731755291129633e-05, "optim/total_tokens": 1963932516352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2660974264144897, "created_at": "2025-06-03T07:04:33.864350+00:00"} {"global_step": 234120, "acc_step": 0, "speed/wps": 5519.693329068034, "speed/FLOPS": 243942192793211.22, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04515133425593376, "optim/lr": 1.7314005686201785e-05, "optim/total_tokens": 1963940904960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2685294151306152, "created_at": "2025-06-03T07:04:36.838908+00:00"} {"global_step": 234121, "acc_step": 0, "speed/wps": 5517.490784716728, "speed/FLOPS": 243844851606527.47, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0510983020067215, "optim/lr": 1.7310458461107238e-05, "optim/total_tokens": 1963949293568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2822142839431763, "created_at": "2025-06-03T07:04:39.811206+00:00"} {"global_step": 234122, "acc_step": 0, "speed/wps": 5500.418245929798, "speed/FLOPS": 243090332777320.34, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04630902782082558, "optim/lr": 1.7306911236012912e-05, "optim/total_tokens": 1963957682176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2798612117767334, "created_at": "2025-06-03T07:04:42.793717+00:00"} {"global_step": 234123, "acc_step": 0, "speed/wps": 5507.85675051688, "speed/FLOPS": 243419076606351.44, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045813918113708496, "optim/lr": 1.7303364010918366e-05, "optim/total_tokens": 1963966070784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2665328979492188, "created_at": "2025-06-03T07:04:45.776043+00:00"} {"global_step": 234124, "acc_step": 0, "speed/wps": 5508.657984875097, "speed/FLOPS": 243454487063895.4, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.03 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.03, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04443971440196037, "optim/lr": 1.729981678582382e-05, "optim/total_tokens": 1963974459392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.264644742012024, "created_at": "2025-06-03T07:04:48.756681+00:00"} {"global_step": 234125, "acc_step": 0, "speed/wps": 5527.199274034873, "speed/FLOPS": 244273917141836.44, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.59, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04487365856766701, "optim/lr": 1.7296269560729273e-05, "optim/total_tokens": 1963982848000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2548902034759521, "created_at": "2025-06-03T07:04:51.724951+00:00"} {"global_step": 234126, "acc_step": 0, "speed/wps": 5535.345666904604, "speed/FLOPS": 244633946009659.88, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.39, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04624268040060997, "optim/lr": 1.7292722335634947e-05, "optim/total_tokens": 1963991236608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2786571979522705, "created_at": "2025-06-03T07:04:54.689191+00:00"} {"global_step": 234127, "acc_step": 0, "speed/wps": 5513.225669675204, "speed/FLOPS": 243656355352529.9, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0447666309773922, "optim/lr": 1.72891751105404e-05, "optim/total_tokens": 1963999625216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.27456533908844, "created_at": "2025-06-03T07:04:57.668260+00:00"} {"global_step": 234128, "acc_step": 0, "speed/wps": 5528.742543412668, "speed/FLOPS": 244342121749166.2, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04624195769429207, "optim/lr": 1.7285627885445854e-05, "optim/total_tokens": 1964008013824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2763701677322388, "created_at": "2025-06-03T07:05:00.635357+00:00"} {"global_step": 234129, "acc_step": 0, "speed/wps": 5518.983263943537, "speed/FLOPS": 243910811549151.25, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045601144433021545, "optim/lr": 1.7282080660351528e-05, "optim/total_tokens": 1964016402432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2705425024032593, "created_at": "2025-06-03T07:05:03.607665+00:00"} {"global_step": 234130, "acc_step": 0, "speed/wps": 5515.446626500943, "speed/FLOPS": 243754510276340.03, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04649647697806358, "optim/lr": 1.727853343525698e-05, "optim/total_tokens": 1964024791040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2757035493850708, "created_at": "2025-06-03T07:05:06.581672+00:00"} {"global_step": 234131, "acc_step": 0, "speed/wps": 5513.42224122295, "speed/FLOPS": 243665042808795.9, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04623357951641083, "optim/lr": 1.7274986210162435e-05, "optim/total_tokens": 1964033179648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2789067029953003, "created_at": "2025-06-03T07:05:09.556871+00:00"} {"global_step": 234132, "acc_step": 0, "speed/wps": 5515.566052251279, "speed/FLOPS": 243759788283228.47, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04646926745772362, "optim/lr": 1.727143898506789e-05, "optim/total_tokens": 1964041568256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2838712930679321, "created_at": "2025-06-03T07:05:12.530963+00:00"} {"global_step": 234133, "acc_step": 0, "speed/wps": 5519.444320727099, "speed/FLOPS": 243931187899082.12, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046906739473342896, "optim/lr": 1.7267891759973562e-05, "optim/total_tokens": 1964049956864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2675758600234985, "created_at": "2025-06-03T07:05:15.505843+00:00"} {"global_step": 234134, "acc_step": 0, "speed/wps": 5523.436375557597, "speed/FLOPS": 244107616289401.2, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04834604635834694, "optim/lr": 1.7264344534879016e-05, "optim/total_tokens": 1964058345472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2592986822128296, "created_at": "2025-06-03T07:05:18.475319+00:00"} {"global_step": 234135, "acc_step": 0, "speed/wps": 5516.061622797055, "speed/FLOPS": 243781689964791.75, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04503726586699486, "optim/lr": 1.726079730978447e-05, "optim/total_tokens": 1964066734080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.271859884262085, "created_at": "2025-06-03T07:05:21.448918+00:00"} {"global_step": 234136, "acc_step": 0, "speed/wps": 5521.493937174431, "speed/FLOPS": 244021770455166.22, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.047530874609947205, "optim/lr": 1.7257250084689923e-05, "optim/total_tokens": 1964075122688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2871507406234741, "created_at": "2025-06-03T07:05:24.419920+00:00"} {"global_step": 234137, "acc_step": 0, "speed/wps": 5512.611715812466, "speed/FLOPS": 243629221734297.62, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04672017693519592, "optim/lr": 1.72537028595956e-05, "optim/total_tokens": 1964083511296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2595962285995483, "created_at": "2025-06-03T07:05:27.395767+00:00"} {"global_step": 234138, "acc_step": 0, "speed/wps": 5517.309847787019, "speed/FLOPS": 243836855120353.5, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.047427449375391006, "optim/lr": 1.725015563450105e-05, "optim/total_tokens": 1964091899904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.270875334739685, "created_at": "2025-06-03T07:05:30.368928+00:00"} {"global_step": 234139, "acc_step": 0, "speed/wps": 5493.558318982084, "speed/FLOPS": 242787159118520.5, "speed/curr_iter_time": 2.9793, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9793, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "4.02 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 4.02, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04993186146020889, "optim/lr": 1.7246608409406504e-05, "optim/total_tokens": 1964100288512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2543034553527832, "created_at": "2025-06-03T07:05:33.357938+00:00"} {"global_step": 234140, "acc_step": 0, "speed/wps": 5511.804979618267, "speed/FLOPS": 243593568123764.2, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04524630308151245, "optim/lr": 1.7243061184311958e-05, "optim/total_tokens": 1964108677120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2812132835388184, "created_at": "2025-06-03T07:05:36.338374+00:00"} {"global_step": 234141, "acc_step": 0, "speed/wps": 5512.782355780348, "speed/FLOPS": 243636763147463.47, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.01 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.01, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04802507534623146, "optim/lr": 1.7239513959217635e-05, "optim/total_tokens": 1964117065728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.269251823425293, "created_at": "2025-06-03T07:05:39.314199+00:00"} {"global_step": 234142, "acc_step": 0, "speed/wps": 5520.691363371339, "speed/FLOPS": 243986300801014.66, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.048094864934682846, "optim/lr": 1.723596673412309e-05, "optim/total_tokens": 1964125454336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2817697525024414, "created_at": "2025-06-03T07:05:42.285352+00:00"} {"global_step": 234143, "acc_step": 0, "speed/wps": 5517.32753552142, "speed/FLOPS": 243837636827680.0, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046494219452142715, "optim/lr": 1.7232419509028542e-05, "optim/total_tokens": 1964133842944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2859771251678467, "created_at": "2025-06-03T07:05:45.261749+00:00"} {"global_step": 234144, "acc_step": 0, "speed/wps": 5533.040002832162, "speed/FLOPS": 244532047459116.5, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.49, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0459388829767704, "optim/lr": 1.7228872283933993e-05, "optim/total_tokens": 1964142231552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2694511413574219, "created_at": "2025-06-03T07:05:48.228758+00:00"} {"global_step": 234145, "acc_step": 0, "speed/wps": 5517.703265743961, "speed/FLOPS": 243854242180354.7, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04477249085903168, "optim/lr": 1.722532505883967e-05, "optim/total_tokens": 1964150620160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2680176496505737, "created_at": "2025-06-03T07:05:51.206017+00:00"} {"global_step": 234146, "acc_step": 0, "speed/wps": 5512.560905861632, "speed/FLOPS": 243626976194539.66, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04593538120388985, "optim/lr": 1.7221777833745123e-05, "optim/total_tokens": 1964159008768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2720099687576294, "created_at": "2025-06-03T07:05:54.181563+00:00"} {"global_step": 234147, "acc_step": 0, "speed/wps": 5514.916242967116, "speed/FLOPS": 243731070038893.88, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04471759870648384, "optim/lr": 1.7218230608650577e-05, "optim/total_tokens": 1964167397376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2757823467254639, "created_at": "2025-06-03T07:05:57.155433+00:00"} {"global_step": 234148, "acc_step": 0, "speed/wps": 5511.362290849952, "speed/FLOPS": 243574003546091.2, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04509592428803444, "optim/lr": 1.721468338355603e-05, "optim/total_tokens": 1964175785984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.256964087486267, "created_at": "2025-06-03T07:06:00.131593+00:00"} {"global_step": 234149, "acc_step": 0, "speed/wps": 5517.025476616221, "speed/FLOPS": 243824287370147.8, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046669069677591324, "optim/lr": 1.7211136158461704e-05, "optim/total_tokens": 1964184174592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2695904970169067, "created_at": "2025-06-03T07:06:03.106969+00:00"} {"global_step": 234150, "acc_step": 0, "speed/wps": 5524.208908348026, "speed/FLOPS": 244141758284556.88, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.75, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.047355905175209045, "optim/lr": 1.7207588933367158e-05, "optim/total_tokens": 1964192563200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2783849239349365, "created_at": "2025-06-03T07:06:06.076195+00:00"} {"global_step": 234151, "acc_step": 0, "speed/wps": 5522.541764032652, "speed/FLOPS": 244068079039035.53, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04560178890824318, "optim/lr": 1.720404170827261e-05, "optim/total_tokens": 1964200951808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2782313823699951, "created_at": "2025-06-03T07:06:09.046081+00:00"} {"global_step": 234152, "acc_step": 0, "speed/wps": 5520.5125378348275, "speed/FLOPS": 243978397627612.9, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045067477971315384, "optim/lr": 1.7200494483178065e-05, "optim/total_tokens": 1964209340416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2785180807113647, "created_at": "2025-06-03T07:06:12.017219+00:00"} {"global_step": 234153, "acc_step": 0, "speed/wps": 5521.109426231296, "speed/FLOPS": 244004777039585.06, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045355796813964844, "optim/lr": 1.719694725808374e-05, "optim/total_tokens": 1964217729024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2783517837524414, "created_at": "2025-06-03T07:06:14.990928+00:00"} {"global_step": 234154, "acc_step": 0, "speed/wps": 5510.498639577341, "speed/FLOPS": 243535834580409.75, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04388340935111046, "optim/lr": 1.7193400032989193e-05, "optim/total_tokens": 1964226117632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2772529125213623, "created_at": "2025-06-03T07:06:17.972259+00:00"} {"global_step": 234155, "acc_step": 0, "speed/wps": 5511.206969737907, "speed/FLOPS": 243567139147944.3, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045086368918418884, "optim/lr": 1.7189852807894646e-05, "optim/total_tokens": 1964234506240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.272141456604004, "created_at": "2025-06-03T07:06:20.950042+00:00"} {"global_step": 234156, "acc_step": 0, "speed/wps": 5514.591676860573, "speed/FLOPS": 243716725878264.62, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05676647648215294, "optim/lr": 1.718630558280032e-05, "optim/total_tokens": 1964242894848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2775708436965942, "created_at": "2025-06-03T07:06:23.930035+00:00"} {"global_step": 234157, "acc_step": 0, "speed/wps": 5506.1261525292075, "speed/FLOPS": 243342593033299.78, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "4.0 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 4.0, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04610510915517807, "optim/lr": 1.7182758357705774e-05, "optim/total_tokens": 1964251283456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2655799388885498, "created_at": "2025-06-03T07:06:26.913245+00:00"} {"global_step": 234158, "acc_step": 0, "speed/wps": 5520.990467666926, "speed/FLOPS": 243999519679925.03, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04564465582370758, "optim/lr": 1.7179211132611227e-05, "optim/total_tokens": 1964259672064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.280709981918335, "created_at": "2025-06-03T07:06:29.886506+00:00"} {"global_step": 234159, "acc_step": 0, "speed/wps": 5519.878768295147, "speed/FLOPS": 243950388257885.62, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04542922601103783, "optim/lr": 1.717566390751668e-05, "optim/total_tokens": 1964268060672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2843286991119385, "created_at": "2025-06-03T07:06:32.862598+00:00"} {"global_step": 234160, "acc_step": 0, "speed/wps": 5527.287692098394, "speed/FLOPS": 244277824767679.34, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.048212599009275436, "optim/lr": 1.7172116682422355e-05, "optim/total_tokens": 1964276449280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2662922143936157, "created_at": "2025-06-03T07:06:35.831054+00:00"} {"global_step": 234161, "acc_step": 0, "speed/wps": 5517.524395789913, "speed/FLOPS": 243846337043925.2, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04569351673126221, "optim/lr": 1.716856945732781e-05, "optim/total_tokens": 1964284837888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2844009399414062, "created_at": "2025-06-03T07:06:38.805473+00:00"} {"global_step": 234162, "acc_step": 0, "speed/wps": 5523.658016802629, "speed/FLOPS": 244117411697968.9, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04796300455927849, "optim/lr": 1.7165022232233262e-05, "optim/total_tokens": 1964293226496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2594897747039795, "created_at": "2025-06-03T07:06:41.775431+00:00"} {"global_step": 234163, "acc_step": 0, "speed/wps": 5510.321109332943, "speed/FLOPS": 243527988652289.5, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044259462505578995, "optim/lr": 1.7161475007138716e-05, "optim/total_tokens": 1964301615104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2648365497589111, "created_at": "2025-06-03T07:06:44.753408+00:00"} {"global_step": 234164, "acc_step": 0, "speed/wps": 5518.083541264907, "speed/FLOPS": 243871048411953.9, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04930533468723297, "optim/lr": 1.7157927782044393e-05, "optim/total_tokens": 1964310003712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.261688470840454, "created_at": "2025-06-03T07:06:47.726089+00:00"} {"global_step": 234165, "acc_step": 0, "speed/wps": 5507.878296055436, "speed/FLOPS": 243420028808875.53, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04523760825395584, "optim/lr": 1.7154380556949843e-05, "optim/total_tokens": 1964318392320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2660894393920898, "created_at": "2025-06-03T07:06:50.704928+00:00"} {"global_step": 234166, "acc_step": 0, "speed/wps": 5523.6685962850825, "speed/FLOPS": 244117879256942.62, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046865932643413544, "optim/lr": 1.7150833331855297e-05, "optim/total_tokens": 1964326780928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2679442167282104, "created_at": "2025-06-03T07:06:53.678454+00:00"} {"global_step": 234167, "acc_step": 0, "speed/wps": 5527.434574821457, "speed/FLOPS": 244284316232224.84, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04975130781531334, "optim/lr": 1.714728610676075e-05, "optim/total_tokens": 1964335169536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2644569873809814, "created_at": "2025-06-03T07:06:56.650117+00:00"} {"global_step": 234168, "acc_step": 0, "speed/wps": 5519.809830862089, "speed/FLOPS": 243947341576198.22, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.048673320561647415, "optim/lr": 1.7143738881666428e-05, "optim/total_tokens": 1964343558144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2685073614120483, "created_at": "2025-06-03T07:06:59.622216+00:00"} {"global_step": 234169, "acc_step": 0, "speed/wps": 5518.780047915469, "speed/FLOPS": 243901830440864.56, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04510883986949921, "optim/lr": 1.714019165657188e-05, "optim/total_tokens": 1964351946752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2715036869049072, "created_at": "2025-06-03T07:07:02.594253+00:00"} {"global_step": 234170, "acc_step": 0, "speed/wps": 5513.82955457215, "speed/FLOPS": 243683043974011.84, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046086687594652176, "optim/lr": 1.713664443147733e-05, "optim/total_tokens": 1964360335360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2800742387771606, "created_at": "2025-06-03T07:07:05.573969+00:00"} {"global_step": 234171, "acc_step": 0, "speed/wps": 5511.430331519947, "speed/FLOPS": 243577010595441.25, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04663063585758209, "optim/lr": 1.7133097206382785e-05, "optim/total_tokens": 1964368723968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2767020463943481, "created_at": "2025-06-03T07:07:08.554906+00:00"} {"global_step": 234172, "acc_step": 0, "speed/wps": 5511.666342605188, "speed/FLOPS": 243587441077394.7, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04580773040652275, "optim/lr": 1.7129549981288462e-05, "optim/total_tokens": 1964377112576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.28143310546875, "created_at": "2025-06-03T07:07:11.532590+00:00"} {"global_step": 234173, "acc_step": 0, "speed/wps": 5504.418139104909, "speed/FLOPS": 243267107582351.0, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.99 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.99, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.048264600336551666, "optim/lr": 1.7126002756193916e-05, "optim/total_tokens": 1964385501184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2818355560302734, "created_at": "2025-06-03T07:07:14.514495+00:00"} {"global_step": 234174, "acc_step": 0, "speed/wps": 5523.130379677552, "speed/FLOPS": 244094092837732.1, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04541286453604698, "optim/lr": 1.712245553109937e-05, "optim/total_tokens": 1964393889792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2640460729599, "created_at": "2025-06-03T07:07:17.488610+00:00"} {"global_step": 234175, "acc_step": 0, "speed/wps": 5529.025468570622, "speed/FLOPS": 244354625593005.53, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04992794618010521, "optim/lr": 1.711890830600482e-05, "optim/total_tokens": 1964402278400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2865346670150757, "created_at": "2025-06-03T07:07:20.454969+00:00"} {"global_step": 234176, "acc_step": 0, "speed/wps": 5528.717579093539, "speed/FLOPS": 244341018454039.66, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04758032411336899, "optim/lr": 1.7115361080910497e-05, "optim/total_tokens": 1964410667008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2558432817459106, "created_at": "2025-06-03T07:07:23.425464+00:00"} {"global_step": 234177, "acc_step": 0, "speed/wps": 5532.372944732146, "speed/FLOPS": 244502566905408.66, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04487897455692291, "optim/lr": 1.711181385581595e-05, "optim/total_tokens": 1964419055616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2578076124191284, "created_at": "2025-06-03T07:07:26.394605+00:00"} {"global_step": 234178, "acc_step": 0, "speed/wps": 5520.004078420291, "speed/FLOPS": 243955926324021.62, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04835743084549904, "optim/lr": 1.7108266630721404e-05, "optim/total_tokens": 1964427444224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2672369480133057, "created_at": "2025-06-03T07:07:29.370473+00:00"} {"global_step": 234179, "acc_step": 0, "speed/wps": 5528.5622668336455, "speed/FLOPS": 244334154447112.6, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 192.6, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04572335630655289, "optim/lr": 1.7104719405626858e-05, "optim/total_tokens": 1964435832832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2694425582885742, "created_at": "2025-06-03T07:07:32.341875+00:00"} {"global_step": 234180, "acc_step": 0, "speed/wps": 5517.451499925376, "speed/FLOPS": 243843115419827.5, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.049302760511636734, "optim/lr": 1.710117218053253e-05, "optim/total_tokens": 1964444221440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2875006198883057, "created_at": "2025-06-03T07:07:35.316509+00:00"} {"global_step": 234181, "acc_step": 0, "speed/wps": 5520.104937200911, "speed/FLOPS": 243960383765883.0, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045910999178886414, "optim/lr": 1.7097624955437985e-05, "optim/total_tokens": 1964452610048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2841579914093018, "created_at": "2025-06-03T07:07:38.294036+00:00"} {"global_step": 234182, "acc_step": 0, "speed/wps": 5508.060761110152, "speed/FLOPS": 243428092830353.2, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.98 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.98, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044848911464214325, "optim/lr": 1.709407773034344e-05, "optim/total_tokens": 1964460998656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2692948579788208, "created_at": "2025-06-03T07:07:41.275017+00:00"} {"global_step": 234183, "acc_step": 0, "speed/wps": 5524.088661801688, "speed/FLOPS": 244136444002686.38, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 192.78, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044991958886384964, "optim/lr": 1.7090530505249113e-05, "optim/total_tokens": 1964469387264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2719330787658691, "created_at": "2025-06-03T07:07:44.244302+00:00"} {"global_step": 234184, "acc_step": 0, "speed/wps": 5525.783373683099, "speed/FLOPS": 244211341593522.97, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04535787180066109, "optim/lr": 1.7086983280154566e-05, "optim/total_tokens": 1964477775872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.278180718421936, "created_at": "2025-06-03T07:07:47.213388+00:00"} {"global_step": 234185, "acc_step": 0, "speed/wps": 5518.098414406606, "speed/FLOPS": 243871705728689.38, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.044801607728004456, "optim/lr": 1.708343605506002e-05, "optim/total_tokens": 1964486164480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2747650146484375, "created_at": "2025-06-03T07:07:50.189055+00:00"} {"global_step": 234186, "acc_step": 0, "speed/wps": 5530.662475216235, "speed/FLOPS": 244426972907782.06, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0485294871032238, "optim/lr": 1.7079888829965473e-05, "optim/total_tokens": 1964494553088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2714309692382812, "created_at": "2025-06-03T07:07:53.160166+00:00"} {"global_step": 234187, "acc_step": 0, "speed/wps": 5524.19501356395, "speed/FLOPS": 244141144206220.7, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04587441310286522, "optim/lr": 1.7076341604871147e-05, "optim/total_tokens": 1964502941696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.285352349281311, "created_at": "2025-06-03T07:07:56.129674+00:00"} {"global_step": 234188, "acc_step": 0, "speed/wps": 5517.277012353998, "speed/FLOPS": 243835403962280.94, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04951321333646774, "optim/lr": 1.70727943797766e-05, "optim/total_tokens": 1964511330304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.260579228401184, "created_at": "2025-06-03T07:07:59.106588+00:00"} {"global_step": 234189, "acc_step": 0, "speed/wps": 5513.142139920485, "speed/FLOPS": 243652663764915.34, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045206375420093536, "optim/lr": 1.7069247154682054e-05, "optim/total_tokens": 1964519718912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2574435472488403, "created_at": "2025-06-03T07:08:02.081895+00:00"} {"global_step": 234190, "acc_step": 0, "speed/wps": 5509.733217621202, "speed/FLOPS": 243502006847733.12, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04966185986995697, "optim/lr": 1.7065699929587508e-05, "optim/total_tokens": 1964528107520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.26962149143219, "created_at": "2025-06-03T07:08:05.059036+00:00"} {"global_step": 234191, "acc_step": 0, "speed/wps": 5528.198797888868, "speed/FLOPS": 244318090980156.16, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044710952788591385, "optim/lr": 1.7062152704493182e-05, "optim/total_tokens": 1964536496128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2540884017944336, "created_at": "2025-06-03T07:08:08.026201+00:00"} {"global_step": 234192, "acc_step": 0, "speed/wps": 5515.28136326026, "speed/FLOPS": 243747206486995.78, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05536587908864021, "optim/lr": 1.7058605479398635e-05, "optim/total_tokens": 1964544884736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.27153742313385, "created_at": "2025-06-03T07:08:11.004330+00:00"} {"global_step": 234193, "acc_step": 0, "speed/wps": 5517.884786201544, "speed/FLOPS": 243862264455473.9, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.04471419006586075, "optim/lr": 1.705505825430409e-05, "optim/total_tokens": 1964553273344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.263938069343567, "created_at": "2025-06-03T07:08:13.981463+00:00"} {"global_step": 234194, "acc_step": 0, "speed/wps": 5525.516776762917, "speed/FLOPS": 244199559374217.7, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.058385320007801056, "optim/lr": 1.7051511029209543e-05, "optim/total_tokens": 1964561661952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2723532915115356, "created_at": "2025-06-03T07:08:16.950690+00:00"} {"global_step": 234195, "acc_step": 0, "speed/wps": 5509.130561293744, "speed/FLOPS": 243475372522734.2, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.045385196805000305, "optim/lr": 1.704796380411522e-05, "optim/total_tokens": 1964570050560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2692331075668335, "created_at": "2025-06-03T07:08:19.928218+00:00"} {"global_step": 234196, "acc_step": 0, "speed/wps": 5426.737205369594, "speed/FLOPS": 239834007918312.94, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.054870083928108215, "optim/lr": 1.7044416579020673e-05, "optim/total_tokens": 1964578439168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2726043462753296, "created_at": "2025-06-03T07:08:22.956056+00:00"} {"global_step": 234197, "acc_step": 0, "speed/wps": 5507.1445704265325, "speed/FLOPS": 243387601891626.22, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.97 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.97, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.0454997755587101, "optim/lr": 1.7040869353926124e-05, "optim/total_tokens": 1964586827776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2838022708892822, "created_at": "2025-06-03T07:08:25.934948+00:00"} {"global_step": 234198, "acc_step": 0, "speed/wps": 5516.0233277653415, "speed/FLOPS": 243779997520401.78, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05126427114009857, "optim/lr": 1.7037322128831577e-05, "optim/total_tokens": 1964595216384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2789883613586426, "created_at": "2025-06-03T07:08:28.912342+00:00"} {"global_step": 234199, "acc_step": 0, "speed/wps": 5516.7495200670355, "speed/FLOPS": 243812091503147.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046370264142751694, "optim/lr": 1.7033774903737254e-05, "optim/total_tokens": 1964603604992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2761595249176025, "created_at": "2025-06-03T07:08:31.891554+00:00"} {"global_step": 234200, "acc_step": 0, "speed/wps": 5523.311646553125, "speed/FLOPS": 244102103905824.44, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05028849095106125, "optim/lr": 1.7030227678642708e-05, "optim/total_tokens": 1964611993600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2784104347229004, "created_at": "2025-06-03T07:08:34.866256+00:00"} {"global_step": 234201, "acc_step": 0, "speed/wps": 5519.698388670296, "speed/FLOPS": 243942416401733.8, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046533431857824326, "optim/lr": 1.7026680453548162e-05, "optim/total_tokens": 1964620382208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.28046715259552, "created_at": "2025-06-03T07:08:37.838048+00:00"} {"global_step": 234202, "acc_step": 0, "speed/wps": 5520.990268410649, "speed/FLOPS": 243999510873817.47, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04545174166560173, "optim/lr": 1.7023133228453612e-05, "optim/total_tokens": 1964628770816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2735822200775146, "created_at": "2025-06-03T07:08:40.811197+00:00"} {"global_step": 234203, "acc_step": 0, "speed/wps": 5515.786146585601, "speed/FLOPS": 243769515326260.6, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05161671340465546, "optim/lr": 1.701958600335929e-05, "optim/total_tokens": 1964637159424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2753502130508423, "created_at": "2025-06-03T07:08:43.785660+00:00"} {"global_step": 234204, "acc_step": 0, "speed/wps": 5513.025440847741, "speed/FLOPS": 243647506263220.1, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045177161693573, "optim/lr": 1.7016038778264743e-05, "optim/total_tokens": 1964645548032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2703857421875, "created_at": "2025-06-03T07:08:46.761480+00:00"} {"global_step": 234205, "acc_step": 0, "speed/wps": 5507.022655155913, "speed/FLOPS": 243382213860683.75, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.05109238997101784, "optim/lr": 1.7012491553170196e-05, "optim/total_tokens": 1964653936640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.257908821105957, "created_at": "2025-06-03T07:08:49.742661+00:00"} {"global_step": 234206, "acc_step": 0, "speed/wps": 5514.106469958296, "speed/FLOPS": 243695282216698.03, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04694667458534241, "optim/lr": 1.700894432807565e-05, "optim/total_tokens": 1964662325248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.266440510749817, "created_at": "2025-06-03T07:08:52.721666+00:00"} {"global_step": 234207, "acc_step": 0, "speed/wps": 5501.924251046715, "speed/FLOPS": 243156890495055.1, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.96 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.96, "speed/est_time_remaining_days": 0.17, "optim/grad_norm": 0.046301841735839844, "optim/lr": 1.7005397102981324e-05, "optim/total_tokens": 1964670713856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2817931175231934, "created_at": "2025-06-03T07:08:55.707097+00:00"} {"global_step": 234208, "acc_step": 0, "speed/wps": 5515.028670831711, "speed/FLOPS": 243736038775051.0, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046355947852134705, "optim/lr": 1.7001849877886777e-05, "optim/total_tokens": 1964679102464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2688419818878174, "created_at": "2025-06-03T07:08:58.683537+00:00"} {"global_step": 234209, "acc_step": 0, "speed/wps": 5514.574916359362, "speed/FLOPS": 243715985149899.1, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04481706768274307, "optim/lr": 1.699830265279223e-05, "optim/total_tokens": 1964687491072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2614980936050415, "created_at": "2025-06-03T07:09:01.662165+00:00"} {"global_step": 234210, "acc_step": 0, "speed/wps": 5526.0758318327125, "speed/FLOPS": 244224266746799.38, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 192.69, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04552885517477989, "optim/lr": 1.6994755427697905e-05, "optim/total_tokens": 1964695879680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.25971257686615, "created_at": "2025-06-03T07:09:04.630690+00:00"} {"global_step": 234211, "acc_step": 0, "speed/wps": 5513.568096335365, "speed/FLOPS": 243671488858210.5, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045122500509023666, "optim/lr": 1.699120820260336e-05, "optim/total_tokens": 1964704268288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2662074565887451, "created_at": "2025-06-03T07:09:07.605832+00:00"} {"global_step": 234212, "acc_step": 0, "speed/wps": 5523.63385497758, "speed/FLOPS": 244116343868973.16, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04787948355078697, "optim/lr": 1.6987660977508812e-05, "optim/total_tokens": 1964712656896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2888849973678589, "created_at": "2025-06-03T07:09:10.574999+00:00"} {"global_step": 234213, "acc_step": 0, "speed/wps": 5510.372073904571, "speed/FLOPS": 243530241025495.16, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046345509588718414, "optim/lr": 1.6984113752414266e-05, "optim/total_tokens": 1964721045504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2874127626419067, "created_at": "2025-06-03T07:09:13.555494+00:00"} {"global_step": 234214, "acc_step": 0, "speed/wps": 5514.261470151555, "speed/FLOPS": 243702132431877.16, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046658068895339966, "optim/lr": 1.698056652731994e-05, "optim/total_tokens": 1964729434112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2711939811706543, "created_at": "2025-06-03T07:09:16.529842+00:00"} {"global_step": 234215, "acc_step": 0, "speed/wps": 5516.2852113483295, "speed/FLOPS": 243791571434328.16, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04766092076897621, "optim/lr": 1.6977019302225393e-05, "optim/total_tokens": 1964737822720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2627854347229004, "created_at": "2025-06-03T07:09:19.503482+00:00"} {"global_step": 234216, "acc_step": 0, "speed/wps": 5515.192747945595, "speed/FLOPS": 243743290143661.9, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04987889155745506, "optim/lr": 1.6973472077130847e-05, "optim/total_tokens": 1964746211328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2860502004623413, "created_at": "2025-06-03T07:09:22.477666+00:00"} {"global_step": 234217, "acc_step": 0, "speed/wps": 5524.115900927018, "speed/FLOPS": 244137647832603.47, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04650544375181198, "optim/lr": 1.69699248520363e-05, "optim/total_tokens": 1964754599936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2675954103469849, "created_at": "2025-06-03T07:09:25.452014+00:00"} {"global_step": 234218, "acc_step": 0, "speed/wps": 5521.605386893311, "speed/FLOPS": 244026695962289.34, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05090546980500221, "optim/lr": 1.6966377626941974e-05, "optim/total_tokens": 1964762988544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.262571096420288, "created_at": "2025-06-03T07:09:28.423841+00:00"} {"global_step": 234219, "acc_step": 0, "speed/wps": 5522.907676733407, "speed/FLOPS": 244084250507497.9, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04572010785341263, "optim/lr": 1.6962830401847428e-05, "optim/total_tokens": 1964771377152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2644762992858887, "created_at": "2025-06-03T07:09:31.398008+00:00"} {"global_step": 234220, "acc_step": 0, "speed/wps": 5518.49835941652, "speed/FLOPS": 243889381251023.44, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.050989553332328796, "optim/lr": 1.695928317675288e-05, "optim/total_tokens": 1964779765760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2635374069213867, "created_at": "2025-06-03T07:09:34.371150+00:00"} {"global_step": 234221, "acc_step": 0, "speed/wps": 5516.823528835433, "speed/FLOPS": 243815362311899.44, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044388726353645325, "optim/lr": 1.6955735951658335e-05, "optim/total_tokens": 1964788154368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2605955600738525, "created_at": "2025-06-03T07:09:37.348452+00:00"} {"global_step": 234222, "acc_step": 0, "speed/wps": 5519.021486676661, "speed/FLOPS": 243912500798313.62, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04620153829455376, "optim/lr": 1.6952188726564012e-05, "optim/total_tokens": 1964796542976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2701475620269775, "created_at": "2025-06-03T07:09:40.324504+00:00"} {"global_step": 234223, "acc_step": 0, "speed/wps": 5498.142768857342, "speed/FLOPS": 242989768337665.28, "speed/curr_iter_time": 2.9771, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9771, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.95 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.95, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044832032173871994, "optim/lr": 1.6948641501469462e-05, "optim/total_tokens": 1964804931584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2907530069351196, "created_at": "2025-06-03T07:09:43.308740+00:00"} {"global_step": 234224, "acc_step": 0, "speed/wps": 5515.208117734809, "speed/FLOPS": 243743969409675.44, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044693127274513245, "optim/lr": 1.6945094276374916e-05, "optim/total_tokens": 1964813320192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.285348653793335, "created_at": "2025-06-03T07:09:46.283775+00:00"} {"global_step": 234225, "acc_step": 0, "speed/wps": 5515.5903575441835, "speed/FLOPS": 243760862452769.06, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04445553943514824, "optim/lr": 1.694154705128037e-05, "optim/total_tokens": 1964821708800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2677093744277954, "created_at": "2025-06-03T07:09:49.258406+00:00"} {"global_step": 234226, "acc_step": 0, "speed/wps": 5521.586331648544, "speed/FLOPS": 244025853818004.2, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04496163874864578, "optim/lr": 1.6937999826186047e-05, "optim/total_tokens": 1964830097408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2611560821533203, "created_at": "2025-06-03T07:09:52.231195+00:00"} {"global_step": 234227, "acc_step": 0, "speed/wps": 5516.863895063881, "speed/FLOPS": 243817146292583.75, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044808242470026016, "optim/lr": 1.69344526010915e-05, "optim/total_tokens": 1964838486016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.278651237487793, "created_at": "2025-06-03T07:09:55.204473+00:00"} {"global_step": 234228, "acc_step": 0, "speed/wps": 5521.368637811839, "speed/FLOPS": 244016232864679.9, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04701470211148262, "optim/lr": 1.693090537599695e-05, "optim/total_tokens": 1964846874624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.277077317237854, "created_at": "2025-06-03T07:09:58.174642+00:00"} {"global_step": 234229, "acc_step": 0, "speed/wps": 5511.04033072308, "speed/FLOPS": 243559774556424.78, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.36, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04853168502449989, "optim/lr": 1.6927358150902404e-05, "optim/total_tokens": 1964855263232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2708708047866821, "created_at": "2025-06-03T07:10:01.150807+00:00"} {"global_step": 234230, "acc_step": 0, "speed/wps": 5518.674761062867, "speed/FLOPS": 243897177300886.53, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045554373413324356, "optim/lr": 1.692381092580808e-05, "optim/total_tokens": 1964863651840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2787786722183228, "created_at": "2025-06-03T07:10:04.126108+00:00"} {"global_step": 234231, "acc_step": 0, "speed/wps": 5509.207216796889, "speed/FLOPS": 243478760303614.78, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044611066579818726, "optim/lr": 1.6920263700713535e-05, "optim/total_tokens": 1964872040448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2735992670059204, "created_at": "2025-06-03T07:10:07.105695+00:00"} {"global_step": 234232, "acc_step": 0, "speed/wps": 5512.452192978137, "speed/FLOPS": 243622171641532.16, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04666151478886604, "optim/lr": 1.691671647561899e-05, "optim/total_tokens": 1964880429056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2783153057098389, "created_at": "2025-06-03T07:10:10.081439+00:00"} {"global_step": 234233, "acc_step": 0, "speed/wps": 5532.774823794343, "speed/FLOPS": 244520327902954.28, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04550202935934067, "optim/lr": 1.691316925052444e-05, "optim/total_tokens": 1964888817664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2630313634872437, "created_at": "2025-06-03T07:10:13.047757+00:00"} {"global_step": 234234, "acc_step": 0, "speed/wps": 5512.438674664611, "speed/FLOPS": 243621574201267.34, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04671824350953102, "optim/lr": 1.6909622025430116e-05, "optim/total_tokens": 1964897206272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2674177885055542, "created_at": "2025-06-03T07:10:16.023008+00:00"} {"global_step": 234235, "acc_step": 0, "speed/wps": 5511.844710324074, "speed/FLOPS": 243595324017600.7, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04541383311152458, "optim/lr": 1.690607480033557e-05, "optim/total_tokens": 1964905594880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.27269446849823, "created_at": "2025-06-03T07:10:18.998882+00:00"} {"global_step": 234236, "acc_step": 0, "speed/wps": 5513.616638659371, "speed/FLOPS": 243673634180469.44, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04850982502102852, "optim/lr": 1.6902527575241023e-05, "optim/total_tokens": 1964913983488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2677041292190552, "created_at": "2025-06-03T07:10:21.974223+00:00"} {"global_step": 234237, "acc_step": 0, "speed/wps": 5503.0382315917905, "speed/FLOPS": 243206122733278.12, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04492587596178055, "optim/lr": 1.6898980350146697e-05, "optim/total_tokens": 1964922372096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2740333080291748, "created_at": "2025-06-03T07:10:24.955019+00:00"} {"global_step": 234238, "acc_step": 0, "speed/wps": 5529.953387795678, "speed/FLOPS": 244395634873231.88, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.053561732172966, "optim/lr": 1.689543312505215e-05, "optim/total_tokens": 1964930760704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2448762655258179, "created_at": "2025-06-03T07:10:27.921287+00:00"} {"global_step": 234239, "acc_step": 0, "speed/wps": 5501.7066242519095, "speed/FLOPS": 243147272504639.6, "speed/curr_iter_time": 2.9768, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9768, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.94 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.94, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046517398208379745, "optim/lr": 1.6891885899957604e-05, "optim/total_tokens": 1964939149312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2564209699630737, "created_at": "2025-06-03T07:10:30.902478+00:00"} {"global_step": 234240, "acc_step": 0, "speed/wps": 5503.9454753440605, "speed/FLOPS": 243246218263433.97, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04829034209251404, "optim/lr": 1.6888338674863058e-05, "optim/total_tokens": 1964947537920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2769211530685425, "created_at": "2025-06-03T07:10:33.882627+00:00"} {"global_step": 234241, "acc_step": 0, "speed/wps": 5508.955793549628, "speed/FLOPS": 243467648682986.66, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.44, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04655561223626137, "optim/lr": 1.6884791449768732e-05, "optim/total_tokens": 1964955926528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2729181051254272, "created_at": "2025-06-03T07:10:36.859800+00:00"} {"global_step": 234242, "acc_step": 0, "speed/wps": 5524.364403295529, "speed/FLOPS": 244148630365341.22, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04969716817140579, "optim/lr": 1.6881244224674185e-05, "optim/total_tokens": 1964964315136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2652535438537598, "created_at": "2025-06-03T07:10:39.831446+00:00"} {"global_step": 234243, "acc_step": 0, "speed/wps": 5525.581022886412, "speed/FLOPS": 244202398724034.7, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04558270424604416, "optim/lr": 1.687769699957964e-05, "optim/total_tokens": 1964972703744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2605113983154297, "created_at": "2025-06-03T07:10:42.802598+00:00"} {"global_step": 234244, "acc_step": 0, "speed/wps": 5518.19451841837, "speed/FLOPS": 243875953034104.4, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046201273798942566, "optim/lr": 1.6874149774485093e-05, "optim/total_tokens": 1964981092352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2819087505340576, "created_at": "2025-06-03T07:10:45.779110+00:00"} {"global_step": 234245, "acc_step": 0, "speed/wps": 5514.789233123568, "speed/FLOPS": 243725456853904.38, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04769724979996681, "optim/lr": 1.6870602549390767e-05, "optim/total_tokens": 1964989480960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2722457647323608, "created_at": "2025-06-03T07:10:48.753596+00:00"} {"global_step": 234246, "acc_step": 0, "speed/wps": 5515.48290461723, "speed/FLOPS": 243756113583391.66, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04451528191566467, "optim/lr": 1.686705532429622e-05, "optim/total_tokens": 1964997869568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2648651599884033, "created_at": "2025-06-03T07:10:51.731193+00:00"} {"global_step": 234247, "acc_step": 0, "speed/wps": 5503.651221257681, "speed/FLOPS": 243233213738944.94, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0504506453871727, "optim/lr": 1.6863508099201674e-05, "optim/total_tokens": 1965006258176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.267146110534668, "created_at": "2025-06-03T07:10:54.714760+00:00"} {"global_step": 234248, "acc_step": 0, "speed/wps": 5506.108723092762, "speed/FLOPS": 243341822741420.88, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.93 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.93, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04520580545067787, "optim/lr": 1.6859960874107127e-05, "optim/total_tokens": 1965014646784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.275718331336975, "created_at": "2025-06-03T07:10:57.698039+00:00"} {"global_step": 234249, "acc_step": 0, "speed/wps": 5508.361581725733, "speed/FLOPS": 243441387561822.38, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05056409537792206, "optim/lr": 1.68564136490128e-05, "optim/total_tokens": 1965023035392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2633136510849, "created_at": "2025-06-03T07:11:00.677835+00:00"} {"global_step": 234250, "acc_step": 0, "speed/wps": 5518.051674102227, "speed/FLOPS": 243869640046474.38, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04725543037056923, "optim/lr": 1.6852866423918255e-05, "optim/total_tokens": 1965031424000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2704553604125977, "created_at": "2025-06-03T07:11:03.650457+00:00"} {"global_step": 234251, "acc_step": 0, "speed/wps": 5521.593775487289, "speed/FLOPS": 244026182797575.72, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04794170334935188, "optim/lr": 1.684931919882371e-05, "optim/total_tokens": 1965039812608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2786122560501099, "created_at": "2025-06-03T07:11:06.624111+00:00"} {"global_step": 234252, "acc_step": 0, "speed/wps": 5521.2848485687355, "speed/FLOPS": 244012529809006.97, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04544674605131149, "optim/lr": 1.6845771973729162e-05, "optim/total_tokens": 1965048201216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2825496196746826, "created_at": "2025-06-03T07:11:09.594899+00:00"} {"global_step": 234253, "acc_step": 0, "speed/wps": 5520.781295912413, "speed/FLOPS": 243990275359013.66, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.051547326147556305, "optim/lr": 1.684222474863484e-05, "optim/total_tokens": 1965056589824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2652199268341064, "created_at": "2025-06-03T07:11:12.566007+00:00"} {"global_step": 234254, "acc_step": 0, "speed/wps": 5524.1062811437805, "speed/FLOPS": 244137222687422.88, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0476076602935791, "optim/lr": 1.6838677523540293e-05, "optim/total_tokens": 1965064978432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2837364673614502, "created_at": "2025-06-03T07:11:15.535836+00:00"} {"global_step": 234255, "acc_step": 0, "speed/wps": 5518.538001446641, "speed/FLOPS": 243891133225848.5, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04683953523635864, "optim/lr": 1.6835130298445743e-05, "optim/total_tokens": 1965073367040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2700204849243164, "created_at": "2025-06-03T07:11:18.508090+00:00"} {"global_step": 234256, "acc_step": 0, "speed/wps": 5500.171213932925, "speed/FLOPS": 243079415227482.9, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 193.76, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04496821016073227, "optim/lr": 1.6831583073351197e-05, "optim/total_tokens": 1965081755648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.269731879234314, "created_at": "2025-06-03T07:11:21.490245+00:00"} {"global_step": 234257, "acc_step": 0, "speed/wps": 5499.443547912697, "speed/FLOPS": 243047256113921.2, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.92 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.92, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044934261590242386, "optim/lr": 1.6828035848256874e-05, "optim/total_tokens": 1965090144256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.27671217918396, "created_at": "2025-06-03T07:11:24.472747+00:00"} {"global_step": 234258, "acc_step": 0, "speed/wps": 5517.70703412954, "speed/FLOPS": 243854408723708.94, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04502927511930466, "optim/lr": 1.6824488623162327e-05, "optim/total_tokens": 1965098532864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.258948802947998, "created_at": "2025-06-03T07:11:27.445593+00:00"} {"global_step": 234259, "acc_step": 0, "speed/wps": 5518.100063040364, "speed/FLOPS": 243871778589863.03, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045308616012334824, "optim/lr": 1.682094139806778e-05, "optim/total_tokens": 1965106921472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.263784408569336, "created_at": "2025-06-03T07:11:30.419489+00:00"} {"global_step": 234260, "acc_step": 0, "speed/wps": 5517.747432325082, "speed/FLOPS": 243856194117175.16, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04927660897374153, "optim/lr": 1.681739417297323e-05, "optim/total_tokens": 1965115310080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2633323669433594, "created_at": "2025-06-03T07:11:33.394260+00:00"} {"global_step": 234261, "acc_step": 0, "speed/wps": 5514.455171823833, "speed/FLOPS": 243710693054336.8, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04606766998767853, "optim/lr": 1.681384694787891e-05, "optim/total_tokens": 1965123698688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2832942008972168, "created_at": "2025-06-03T07:11:36.369267+00:00"} {"global_step": 234262, "acc_step": 0, "speed/wps": 5513.27621283754, "speed/FLOPS": 243658589101601.78, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04612568020820618, "optim/lr": 1.6810299722784362e-05, "optim/total_tokens": 1965132087296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.274859070777893, "created_at": "2025-06-03T07:11:39.345204+00:00"} {"global_step": 234263, "acc_step": 0, "speed/wps": 5511.753366864462, "speed/FLOPS": 243591287104224.03, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045958977192640305, "optim/lr": 1.6806752497689816e-05, "optim/total_tokens": 1965140475904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2676212787628174, "created_at": "2025-06-03T07:11:42.324896+00:00"} {"global_step": 234264, "acc_step": 0, "speed/wps": 5517.083251675646, "speed/FLOPS": 243826840732054.88, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.050498779863119125, "optim/lr": 1.680320527259549e-05, "optim/total_tokens": 1965148864512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2798731327056885, "created_at": "2025-06-03T07:11:45.301308+00:00"} {"global_step": 234265, "acc_step": 0, "speed/wps": 5506.747159671346, "speed/FLOPS": 243370038370379.6, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045390766113996506, "optim/lr": 1.6799658047500943e-05, "optim/total_tokens": 1965157253120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2656594514846802, "created_at": "2025-06-03T07:11:48.279756+00:00"} {"global_step": 234266, "acc_step": 0, "speed/wps": 5510.551485448012, "speed/FLOPS": 243538170097403.7, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047923799604177475, "optim/lr": 1.6796110822406397e-05, "optim/total_tokens": 1965165641728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2700728178024292, "created_at": "2025-06-03T07:11:51.256415+00:00"} {"global_step": 234267, "acc_step": 0, "speed/wps": 5519.865343429195, "speed/FLOPS": 243949794947525.22, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.9 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.9, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045460302382707596, "optim/lr": 1.679256359731185e-05, "optim/total_tokens": 1965174030336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2727962732315063, "created_at": "2025-06-03T07:11:54.228083+00:00"} {"global_step": 234268, "acc_step": 0, "speed/wps": 5525.351952478659, "speed/FLOPS": 244192274984500.62, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.9 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.9, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05035388097167015, "optim/lr": 1.6789016372217524e-05, "optim/total_tokens": 1965182418944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2708967924118042, "created_at": "2025-06-03T07:11:57.196567+00:00"} {"global_step": 234269, "acc_step": 0, "speed/wps": 5513.80296159578, "speed/FLOPS": 243681868700571.47, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.9 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.9, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.048199620097875595, "optim/lr": 1.6785469147122978e-05, "optim/total_tokens": 1965190807552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2552319765090942, "created_at": "2025-06-03T07:12:00.172443+00:00"} {"global_step": 234270, "acc_step": 0, "speed/wps": 5519.232206009621, "speed/FLOPS": 243921813514271.16, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.9 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.9, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.050051964819431305, "optim/lr": 1.678192192202843e-05, "optim/total_tokens": 1965199196160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2575948238372803, "created_at": "2025-06-03T07:12:03.144347+00:00"} {"global_step": 234271, "acc_step": 0, "speed/wps": 5516.30519563993, "speed/FLOPS": 243792454637728.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.9 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.9, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05198562890291214, "optim/lr": 1.6778374696933885e-05, "optim/total_tokens": 1965207584768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2786755561828613, "created_at": "2025-06-03T07:12:06.121003+00:00"} {"global_step": 234272, "acc_step": 0, "speed/wps": 5515.873702223648, "speed/FLOPS": 243773384837311.88, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.9 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.9, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04510948434472084, "optim/lr": 1.677482747183956e-05, "optim/total_tokens": 1965215973376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.263899803161621, "created_at": "2025-06-03T07:12:09.096906+00:00"} {"global_step": 234273, "acc_step": 0, "speed/wps": 5518.155857108875, "speed/FLOPS": 243874244402111.28, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044912517070770264, "optim/lr": 1.6771280246745012e-05, "optim/total_tokens": 1965224361984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.272960901260376, "created_at": "2025-06-03T07:12:12.073950+00:00"} {"global_step": 234274, "acc_step": 0, "speed/wps": 5498.617065561542, "speed/FLOPS": 243010729824320.3, "speed/curr_iter_time": 2.9785, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9785, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04459536820650101, "optim/lr": 1.6767733021650466e-05, "optim/total_tokens": 1965232750592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2620441913604736, "created_at": "2025-06-03T07:12:15.061014+00:00"} {"global_step": 234275, "acc_step": 0, "speed/wps": 5497.710306052082, "speed/FLOPS": 242970655695218.06, "speed/curr_iter_time": 2.9789, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9789, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.91 hours", "speed/est_time_elapsed_hrs": 193.86, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.91, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045288655906915665, "optim/lr": 1.676418579655592e-05, "optim/total_tokens": 1965241139200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2596447467803955, "created_at": "2025-06-03T07:12:18.049630+00:00"} {"global_step": 234276, "acc_step": 0, "speed/wps": 5526.792687820115, "speed/FLOPS": 244255948112241.03, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04550594836473465, "optim/lr": 1.6760638571461593e-05, "optim/total_tokens": 1965249527808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.269587755203247, "created_at": "2025-06-03T07:12:21.022337+00:00"} {"global_step": 234277, "acc_step": 0, "speed/wps": 5529.438627463753, "speed/FLOPS": 244372885101343.0, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04487760365009308, "optim/lr": 1.6757091346367047e-05, "optim/total_tokens": 1965257916416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2883343696594238, "created_at": "2025-06-03T07:12:23.992932+00:00"} {"global_step": 234278, "acc_step": 0, "speed/wps": 5526.110343483323, "speed/FLOPS": 244225791985109.72, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04790767654776573, "optim/lr": 1.67535441212725e-05, "optim/total_tokens": 1965266305024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2755601406097412, "created_at": "2025-06-03T07:12:26.961516+00:00"} {"global_step": 234279, "acc_step": 0, "speed/wps": 5516.9184102406825, "speed/FLOPS": 243819555584364.4, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045956410467624664, "optim/lr": 1.6749996896177954e-05, "optim/total_tokens": 1965274693632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2805981636047363, "created_at": "2025-06-03T07:12:29.935079+00:00"} {"global_step": 234280, "acc_step": 0, "speed/wps": 5513.333228620493, "speed/FLOPS": 243661108907375.1, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04576333239674568, "optim/lr": 1.674644967108363e-05, "optim/total_tokens": 1965283082240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2712887525558472, "created_at": "2025-06-03T07:12:32.911583+00:00"} {"global_step": 234281, "acc_step": 0, "speed/wps": 5517.158382387402, "speed/FLOPS": 243830161124960.6, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0456506572663784, "optim/lr": 1.6742902445989082e-05, "optim/total_tokens": 1965291470848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2844007015228271, "created_at": "2025-06-03T07:12:35.888496+00:00"} {"global_step": 234282, "acc_step": 0, "speed/wps": 5516.986701924558, "speed/FLOPS": 243822573727243.16, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045882448554039, "optim/lr": 1.6739355220894535e-05, "optim/total_tokens": 1965299859456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.282034158706665, "created_at": "2025-06-03T07:12:38.865054+00:00"} {"global_step": 234283, "acc_step": 0, "speed/wps": 5522.428588450207, "speed/FLOPS": 244063077257576.6, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04466332867741585, "optim/lr": 1.673580799579999e-05, "optim/total_tokens": 1965308248064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2720121145248413, "created_at": "2025-06-03T07:12:41.835348+00:00"} {"global_step": 234284, "acc_step": 0, "speed/wps": 5534.351648368899, "speed/FLOPS": 244590015478229.8, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.48, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047688428312540054, "optim/lr": 1.6732260770705666e-05, "optim/total_tokens": 1965316636672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.26899254322052, "created_at": "2025-06-03T07:12:44.804918+00:00"} {"global_step": 234285, "acc_step": 0, "speed/wps": 5526.666143013676, "speed/FLOPS": 244250355479511.47, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044816456735134125, "optim/lr": 1.672871354561112e-05, "optim/total_tokens": 1965325025280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.277844786643982, "created_at": "2025-06-03T07:12:47.776768+00:00"} {"global_step": 234286, "acc_step": 0, "speed/wps": 5525.626347906081, "speed/FLOPS": 244204401857909.56, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04605196416378021, "optim/lr": 1.672516632051657e-05, "optim/total_tokens": 1965333413888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2623311281204224, "created_at": "2025-06-03T07:12:50.745328+00:00"} {"global_step": 234287, "acc_step": 0, "speed/wps": 5512.465470829113, "speed/FLOPS": 243622758454583.1, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04497203230857849, "optim/lr": 1.6721619095422024e-05, "optim/total_tokens": 1965341802496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2861310243606567, "created_at": "2025-06-03T07:12:53.724668+00:00"} {"global_step": 234288, "acc_step": 0, "speed/wps": 5508.225653559229, "speed/FLOPS": 243435380232606.28, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046083685010671616, "optim/lr": 1.67180718703277e-05, "optim/total_tokens": 1965350191104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2598472833633423, "created_at": "2025-06-03T07:12:56.703376+00:00"} {"global_step": 234289, "acc_step": 0, "speed/wps": 5518.441510262408, "speed/FLOPS": 243886868809392.06, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04777387157082558, "optim/lr": 1.6714524645233154e-05, "optim/total_tokens": 1965358579712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2774244546890259, "created_at": "2025-06-03T07:12:59.679597+00:00"} {"global_step": 234290, "acc_step": 0, "speed/wps": 5514.495747132445, "speed/FLOPS": 243712486275294.22, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04613987356424332, "optim/lr": 1.6710977420138608e-05, "optim/total_tokens": 1965366968320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2638481855392456, "created_at": "2025-06-03T07:13:02.658202+00:00"} {"global_step": 234291, "acc_step": 0, "speed/wps": 5511.183767025437, "speed/FLOPS": 243566113706815.4, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04847461357712746, "optim/lr": 1.6707430195044282e-05, "optim/total_tokens": 1965375356928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2605704069137573, "created_at": "2025-06-03T07:13:05.635939+00:00"} {"global_step": 234292, "acc_step": 0, "speed/wps": 5528.767474075056, "speed/FLOPS": 244343223556837.06, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04619181156158447, "optim/lr": 1.6703882969949735e-05, "optim/total_tokens": 1965383745536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2736209630966187, "created_at": "2025-06-03T07:13:08.602633+00:00"} {"global_step": 234293, "acc_step": 0, "speed/wps": 5529.083321895645, "speed/FLOPS": 244357182413851.38, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045961953699588776, "optim/lr": 1.670033574485519e-05, "optim/total_tokens": 1965392134144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2634060382843018, "created_at": "2025-06-03T07:13:11.571145+00:00"} {"global_step": 234294, "acc_step": 0, "speed/wps": 5520.639121063897, "speed/FLOPS": 243983991958426.06, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04560140520334244, "optim/lr": 1.6696788519760643e-05, "optim/total_tokens": 1965400522752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2694569826126099, "created_at": "2025-06-03T07:13:14.542548+00:00"} {"global_step": 234295, "acc_step": 0, "speed/wps": 5522.860229439651, "speed/FLOPS": 244082153579971.2, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0496399886906147, "optim/lr": 1.6693241294666317e-05, "optim/total_tokens": 1965408911360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2625937461853027, "created_at": "2025-06-03T07:13:17.517215+00:00"} {"global_step": 234296, "acc_step": 0, "speed/wps": 5523.086214445522, "speed/FLOPS": 244092140960534.56, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044749557971954346, "optim/lr": 1.668969406957177e-05, "optim/total_tokens": 1965417299968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2586137056350708, "created_at": "2025-06-03T07:13:20.487300+00:00"} {"global_step": 234297, "acc_step": 0, "speed/wps": 5519.202865315757, "speed/FLOPS": 243920516805781.62, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.053277358412742615, "optim/lr": 1.6686146844477224e-05, "optim/total_tokens": 1965425688576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2652226686477661, "created_at": "2025-06-03T07:13:23.459063+00:00"} {"global_step": 234298, "acc_step": 0, "speed/wps": 5525.89678227929, "speed/FLOPS": 244216353672996.8, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045651715248823166, "optim/lr": 1.6682599619382677e-05, "optim/total_tokens": 1965434077184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2778328657150269, "created_at": "2025-06-03T07:13:26.432011+00:00"} {"global_step": 234299, "acc_step": 0, "speed/wps": 5525.632492279941, "speed/FLOPS": 244204673407784.44, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05005158483982086, "optim/lr": 1.667905239428835e-05, "optim/total_tokens": 1965442465792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.261872410774231, "created_at": "2025-06-03T07:13:29.404928+00:00"} {"global_step": 234300, "acc_step": 0, "speed/wps": 5524.030471503132, "speed/FLOPS": 244133872289335.12, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046292487531900406, "optim/lr": 1.6675505169193805e-05, "optim/total_tokens": 1965450854400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.280214548110962, "created_at": "2025-06-03T07:13:32.377135+00:00"} {"global_step": 234301, "acc_step": 0, "speed/wps": 5535.98585904892, "speed/FLOPS": 244662239225638.22, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05082084238529205, "optim/lr": 1.667195794409926e-05, "optim/total_tokens": 1965459243008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2798502445220947, "created_at": "2025-06-03T07:13:35.344435+00:00"} {"global_step": 234302, "acc_step": 0, "speed/wps": 5527.293938720867, "speed/FLOPS": 244278100836419.56, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045032668858766556, "optim/lr": 1.6668410719004712e-05, "optim/total_tokens": 1965467631616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2723039388656616, "created_at": "2025-06-03T07:13:38.317141+00:00"} {"global_step": 234303, "acc_step": 0, "speed/wps": 5514.864110334134, "speed/FLOPS": 243728766043355.1, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.87 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.87, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04941527545452118, "optim/lr": 1.6664863493910386e-05, "optim/total_tokens": 1965476020224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2699357271194458, "created_at": "2025-06-03T07:13:41.291685+00:00"} {"global_step": 234304, "acc_step": 0, "speed/wps": 5509.259418515123, "speed/FLOPS": 243481067352368.1, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04659120738506317, "optim/lr": 1.666131626881584e-05, "optim/total_tokens": 1965484408832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2695016860961914, "created_at": "2025-06-03T07:13:44.269061+00:00"} {"global_step": 234305, "acc_step": 0, "speed/wps": 5495.239597263381, "speed/FLOPS": 242861463012991.5, "speed/curr_iter_time": 2.9802, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9802, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04833909124135971, "optim/lr": 1.6657769043721293e-05, "optim/total_tokens": 1965492797440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2662005424499512, "created_at": "2025-06-03T07:13:47.255629+00:00"} {"global_step": 234306, "acc_step": 0, "speed/wps": 5487.951232004332, "speed/FLOPS": 242539354573776.72, "speed/curr_iter_time": 2.9843, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9843, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04587215930223465, "optim/lr": 1.6654221818626747e-05, "optim/total_tokens": 1965501186048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2680109739303589, "created_at": "2025-06-03T07:13:50.245255+00:00"} {"global_step": 234307, "acc_step": 0, "speed/wps": 5481.618981414611, "speed/FLOPS": 242259501509107.72, "speed/curr_iter_time": 2.9861, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9861, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04667247086763382, "optim/lr": 1.6650674593532424e-05, "optim/total_tokens": 1965509574656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2940800189971924, "created_at": "2025-06-03T07:13:53.237708+00:00"} {"global_step": 234308, "acc_step": 0, "speed/wps": 5488.532370459965, "speed/FLOPS": 242565037918979.4, "speed/curr_iter_time": 2.9839, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9839, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04619656130671501, "optim/lr": 1.6647127368437874e-05, "optim/total_tokens": 1965517963264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2656059265136719, "created_at": "2025-06-03T07:13:56.226121+00:00"} {"global_step": 234309, "acc_step": 0, "speed/wps": 5491.9669355344195, "speed/FLOPS": 242716828115572.62, "speed/curr_iter_time": 2.9821, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9821, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.89 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.89, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04503680020570755, "optim/lr": 1.6643580143343328e-05, "optim/total_tokens": 1965526351872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2818769216537476, "created_at": "2025-06-03T07:13:59.212298+00:00"} {"global_step": 234310, "acc_step": 0, "speed/wps": 5496.3572393573695, "speed/FLOPS": 242910857072934.94, "speed/curr_iter_time": 2.9782, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9782, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 193.84, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05347728729248047, "optim/lr": 1.664003291824878e-05, "optim/total_tokens": 1965534740480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2711650133132935, "created_at": "2025-06-03T07:14:02.197190+00:00"} {"global_step": 234311, "acc_step": 0, "speed/wps": 5504.026135853266, "speed/FLOPS": 243249783045082.94, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.88 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.88, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04794000834226608, "optim/lr": 1.663648569315446e-05, "optim/total_tokens": 1965543129088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2794718742370605, "created_at": "2025-06-03T07:14:05.177672+00:00"} {"global_step": 234312, "acc_step": 0, "speed/wps": 5518.062371451348, "speed/FLOPS": 243870112814551.53, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.049370262771844864, "optim/lr": 1.6632938468059912e-05, "optim/total_tokens": 1965551517696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2450973987579346, "created_at": "2025-06-03T07:14:08.149944+00:00"} {"global_step": 234313, "acc_step": 0, "speed/wps": 5524.089622774968, "speed/FLOPS": 244136486472786.66, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04614439234137535, "optim/lr": 1.6629391242965362e-05, "optim/total_tokens": 1965559906304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2704538106918335, "created_at": "2025-06-03T07:14:11.119198+00:00"} {"global_step": 234314, "acc_step": 0, "speed/wps": 5515.8076889197855, "speed/FLOPS": 243770467387167.88, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04741714149713516, "optim/lr": 1.6625844017870816e-05, "optim/total_tokens": 1965568294912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2751826047897339, "created_at": "2025-06-03T07:14:14.093419+00:00"} {"global_step": 234315, "acc_step": 0, "speed/wps": 5533.857485268942, "speed/FLOPS": 244568175998567.75, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 192.62, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045569535344839096, "optim/lr": 1.6622296792776493e-05, "optim/total_tokens": 1965576683520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2567387819290161, "created_at": "2025-06-03T07:14:17.057336+00:00"} {"global_step": 234316, "acc_step": 0, "speed/wps": 5517.998111824187, "speed/FLOPS": 243867272867941.62, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04548950120806694, "optim/lr": 1.6618749567681947e-05, "optim/total_tokens": 1965585072128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2826237678527832, "created_at": "2025-06-03T07:14:20.033117+00:00"} {"global_step": 234317, "acc_step": 0, "speed/wps": 5510.7341423365115, "speed/FLOPS": 243546242596952.7, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045104775577783585, "optim/lr": 1.66152023425874e-05, "optim/total_tokens": 1965593460736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.273917317390442, "created_at": "2025-06-03T07:14:23.009918+00:00"} {"global_step": 234318, "acc_step": 0, "speed/wps": 5533.767524392595, "speed/FLOPS": 244564200188294.72, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 192.64, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04612766578793526, "optim/lr": 1.6611655117493074e-05, "optim/total_tokens": 1965601849344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2714921236038208, "created_at": "2025-06-03T07:14:25.976915+00:00"} {"global_step": 234319, "acc_step": 0, "speed/wps": 5522.707241190952, "speed/FLOPS": 244075392282443.5, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04782171919941902, "optim/lr": 1.6608107892398528e-05, "optim/total_tokens": 1965610237952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.268181324005127, "created_at": "2025-06-03T07:14:28.947221+00:00"} {"global_step": 234320, "acc_step": 0, "speed/wps": 5529.803507492093, "speed/FLOPS": 244389010930970.3, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.049125928431749344, "optim/lr": 1.660456066730398e-05, "optim/total_tokens": 1965618626560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2587101459503174, "created_at": "2025-06-03T07:14:31.913367+00:00"} {"global_step": 234321, "acc_step": 0, "speed/wps": 5522.616032313914, "speed/FLOPS": 244071361316927.78, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047779668122529984, "optim/lr": 1.6601013442209435e-05, "optim/total_tokens": 1965627015168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2619874477386475, "created_at": "2025-06-03T07:14:34.883845+00:00"} {"global_step": 234322, "acc_step": 0, "speed/wps": 5524.21762384798, "speed/FLOPS": 244142143465044.88, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.052342768758535385, "optim/lr": 1.659746621711511e-05, "optim/total_tokens": 1965635403776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2811442613601685, "created_at": "2025-06-03T07:14:37.856893+00:00"} {"global_step": 234323, "acc_step": 0, "speed/wps": 5511.958720990419, "speed/FLOPS": 243600362705493.66, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0457049161195755, "optim/lr": 1.6593918992020562e-05, "optim/total_tokens": 1965643792384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2723424434661865, "created_at": "2025-06-03T07:14:40.837157+00:00"} {"global_step": 234324, "acc_step": 0, "speed/wps": 5514.578648925357, "speed/FLOPS": 243716150110211.1, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04563101381063461, "optim/lr": 1.6590371766926016e-05, "optim/total_tokens": 1965652180992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2608349323272705, "created_at": "2025-06-03T07:14:43.812465+00:00"} {"global_step": 234325, "acc_step": 0, "speed/wps": 5506.406535828979, "speed/FLOPS": 243354984540017.88, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.86 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.86, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04585195332765579, "optim/lr": 1.658682454183147e-05, "optim/total_tokens": 1965660569600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2698601484298706, "created_at": "2025-06-03T07:14:46.792313+00:00"} {"global_step": 234326, "acc_step": 0, "speed/wps": 5534.523291721255, "speed/FLOPS": 244597601235853.66, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044775642454624176, "optim/lr": 1.6583277316737144e-05, "optim/total_tokens": 1965668958208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2770195007324219, "created_at": "2025-06-03T07:14:49.761048+00:00"} {"global_step": 234327, "acc_step": 0, "speed/wps": 5525.478098256449, "speed/FLOPS": 244197849982206.3, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 192.81, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0451253280043602, "optim/lr": 1.6579730091642597e-05, "optim/total_tokens": 1965677346816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.265257716178894, "created_at": "2025-06-03T07:14:52.730832+00:00"} {"global_step": 234328, "acc_step": 0, "speed/wps": 5526.074387600311, "speed/FLOPS": 244224202919119.47, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045065004378557205, "optim/lr": 1.657618286654805e-05, "optim/total_tokens": 1965685735424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2683387994766235, "created_at": "2025-06-03T07:14:55.699222+00:00"} {"global_step": 234329, "acc_step": 0, "speed/wps": 5515.457039242862, "speed/FLOPS": 243754970466235.6, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0454779714345932, "optim/lr": 1.6572635641453504e-05, "optim/total_tokens": 1965694124032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2717286348342896, "created_at": "2025-06-03T07:14:58.675681+00:00"} {"global_step": 234330, "acc_step": 0, "speed/wps": 5521.632786105745, "speed/FLOPS": 244027906867237.03, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 193.06, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045276742428541183, "optim/lr": 1.6569088416359178e-05, "optim/total_tokens": 1965702512640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2691986560821533, "created_at": "2025-06-03T07:15:01.648922+00:00"} {"global_step": 234331, "acc_step": 0, "speed/wps": 5522.342265574983, "speed/FLOPS": 244059262228332.22, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04511373117566109, "optim/lr": 1.6565541191264632e-05, "optim/total_tokens": 1965710901248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2753723859786987, "created_at": "2025-06-03T07:15:04.621417+00:00"} {"global_step": 234332, "acc_step": 0, "speed/wps": 5529.057511265128, "speed/FLOPS": 244356041716093.3, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04449842870235443, "optim/lr": 1.6561993966170085e-05, "optim/total_tokens": 1965719289856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2585965394973755, "created_at": "2025-06-03T07:15:07.588183+00:00"} {"global_step": 234333, "acc_step": 0, "speed/wps": 5519.958858578948, "speed/FLOPS": 243953927838490.38, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.049221113324165344, "optim/lr": 1.655844674107554e-05, "optim/total_tokens": 1965727678464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2797622680664062, "created_at": "2025-06-03T07:15:10.559122+00:00"} {"global_step": 234334, "acc_step": 0, "speed/wps": 5539.93004976244, "speed/FLOPS": 244836552266977.62, "speed/curr_iter_time": 2.9547, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9547, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 192.33, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04543791338801384, "optim/lr": 1.6554899515981213e-05, "optim/total_tokens": 1965736067072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2691631317138672, "created_at": "2025-06-03T07:15:13.519896+00:00"} {"global_step": 234335, "acc_step": 0, "speed/wps": 5530.049884330287, "speed/FLOPS": 244399899526147.53, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04664843529462814, "optim/lr": 1.6551352290886666e-05, "optim/total_tokens": 1965744455680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2773938179016113, "created_at": "2025-06-03T07:15:16.487743+00:00"} {"global_step": 234336, "acc_step": 0, "speed/wps": 5526.491109471336, "speed/FLOPS": 244242619892842.9, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04491858184337616, "optim/lr": 1.654780506579212e-05, "optim/total_tokens": 1965752844288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2600277662277222, "created_at": "2025-06-03T07:15:19.457365+00:00"} {"global_step": 234337, "acc_step": 0, "speed/wps": 5518.624982727893, "speed/FLOPS": 243894977353269.28, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04673737287521362, "optim/lr": 1.6544257840697574e-05, "optim/total_tokens": 1965761232896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.258055567741394, "created_at": "2025-06-03T07:15:22.429771+00:00"} {"global_step": 234338, "acc_step": 0, "speed/wps": 5522.03515721582, "speed/FLOPS": 244045689610780.28, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 193.06, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04558946564793587, "optim/lr": 1.654071061560325e-05, "optim/total_tokens": 1965769621504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.272944688796997, "created_at": "2025-06-03T07:15:25.399893+00:00"} {"global_step": 234339, "acc_step": 0, "speed/wps": 5521.674506964553, "speed/FLOPS": 244029750715649.62, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04774267226457596, "optim/lr": 1.65371633905087e-05, "optim/total_tokens": 1965778010112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2726619243621826, "created_at": "2025-06-03T07:15:28.370990+00:00"} {"global_step": 234340, "acc_step": 0, "speed/wps": 5526.531654625419, "speed/FLOPS": 244244411781124.47, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05118224024772644, "optim/lr": 1.6533616165414155e-05, "optim/total_tokens": 1965786398720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2582108974456787, "created_at": "2025-06-03T07:15:31.339414+00:00"} {"global_step": 234341, "acc_step": 0, "speed/wps": 5502.739439234103, "speed/FLOPS": 243192917640426.25, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.053965404629707336, "optim/lr": 1.653006894031961e-05, "optim/total_tokens": 1965794787328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2822301387786865, "created_at": "2025-06-03T07:15:34.324586+00:00"} {"global_step": 234342, "acc_step": 0, "speed/wps": 5528.599122517189, "speed/FLOPS": 244335783279680.72, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04689132049679756, "optim/lr": 1.6526521715225286e-05, "optim/total_tokens": 1965803175936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2690436840057373, "created_at": "2025-06-03T07:15:37.291731+00:00"} {"global_step": 234343, "acc_step": 0, "speed/wps": 5527.758837680148, "speed/FLOPS": 244298646990851.2, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 192.86, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05338159576058388, "optim/lr": 1.652297449013074e-05, "optim/total_tokens": 1965811564544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2548342943191528, "created_at": "2025-06-03T07:15:40.262469+00:00"} {"global_step": 234344, "acc_step": 0, "speed/wps": 5529.838674530994, "speed/FLOPS": 244390565134088.53, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04800904542207718, "optim/lr": 1.651942726503619e-05, "optim/total_tokens": 1965819953152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2753182649612427, "created_at": "2025-06-03T07:15:43.228930+00:00"} {"global_step": 234345, "acc_step": 0, "speed/wps": 5512.238597558858, "speed/FLOPS": 243612731817280.5, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.048791076987981796, "optim/lr": 1.6515880039941643e-05, "optim/total_tokens": 1965828341760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2738163471221924, "created_at": "2025-06-03T07:15:46.207951+00:00"} {"global_step": 234346, "acc_step": 0, "speed/wps": 5512.680373373562, "speed/FLOPS": 243632256047076.84, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.84 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.84, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05574759095907211, "optim/lr": 1.651233281484732e-05, "optim/total_tokens": 1965836730368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.266147255897522, "created_at": "2025-06-03T07:15:49.183257+00:00"} {"global_step": 234347, "acc_step": 0, "speed/wps": 5524.623098680464, "speed/FLOPS": 244160063377232.34, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046918150037527084, "optim/lr": 1.6508785589752774e-05, "optim/total_tokens": 1965845118976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.266605257987976, "created_at": "2025-06-03T07:15:52.152633+00:00"} {"global_step": 234348, "acc_step": 0, "speed/wps": 5518.575556713915, "speed/FLOPS": 243892792976436.72, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 193.08, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.06100206449627876, "optim/lr": 1.6505238364658227e-05, "optim/total_tokens": 1965853507584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2739814519882202, "created_at": "2025-06-03T07:15:55.129478+00:00"} {"global_step": 234349, "acc_step": 0, "speed/wps": 5519.864309450935, "speed/FLOPS": 243949749250978.53, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044759560376405716, "optim/lr": 1.65016911395639e-05, "optim/total_tokens": 1965861896192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.258736252784729, "created_at": "2025-06-03T07:15:58.101265+00:00"} {"global_step": 234350, "acc_step": 0, "speed/wps": 5497.046977070738, "speed/FLOPS": 242941339949468.16, "speed/curr_iter_time": 2.9793, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9793, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.85 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.85, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.055617913603782654, "optim/lr": 1.6498143914469355e-05, "optim/total_tokens": 1965870284800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2797489166259766, "created_at": "2025-06-03T07:16:01.084968+00:00"} {"global_step": 234351, "acc_step": 0, "speed/wps": 5516.505809383664, "speed/FLOPS": 243801320738366.84, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04763554781675339, "optim/lr": 1.649459668937481e-05, "optim/total_tokens": 1965878673408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2651184797286987, "created_at": "2025-06-03T07:16:04.058144+00:00"} {"global_step": 234352, "acc_step": 0, "speed/wps": 5524.527216053345, "speed/FLOPS": 244155825855885.47, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04853442683815956, "optim/lr": 1.6491049464280262e-05, "optim/total_tokens": 1965887062016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2877830266952515, "created_at": "2025-06-03T07:16:07.027427+00:00"} {"global_step": 234353, "acc_step": 0, "speed/wps": 5528.821120525012, "speed/FLOPS": 244345594455337.7, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05107330530881882, "optim/lr": 1.6487502239185936e-05, "optim/total_tokens": 1965895450624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.26260244846344, "created_at": "2025-06-03T07:16:09.994404+00:00"} {"global_step": 234354, "acc_step": 0, "speed/wps": 5530.801755663649, "speed/FLOPS": 244433128390655.78, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 192.68, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04682549461722374, "optim/lr": 1.648395501409139e-05, "optim/total_tokens": 1965903839232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2739689350128174, "created_at": "2025-06-03T07:16:12.960583+00:00"} {"global_step": 234355, "acc_step": 0, "speed/wps": 5526.511042343534, "speed/FLOPS": 244243500823768.38, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04934757202863693, "optim/lr": 1.6480407788996843e-05, "optim/total_tokens": 1965912227840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.256178617477417, "created_at": "2025-06-03T07:16:15.928734+00:00"} {"global_step": 234356, "acc_step": 0, "speed/wps": 5525.988093914642, "speed/FLOPS": 244220389179904.06, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04535939544439316, "optim/lr": 1.6476860563902297e-05, "optim/total_tokens": 1965920616448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2659978866577148, "created_at": "2025-06-03T07:16:18.899837+00:00"} {"global_step": 234357, "acc_step": 0, "speed/wps": 5520.349140961179, "speed/FLOPS": 243971176322138.66, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05025273561477661, "optim/lr": 1.647331333880797e-05, "optim/total_tokens": 1965929005056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2779850959777832, "created_at": "2025-06-03T07:16:21.871078+00:00"} {"global_step": 234358, "acc_step": 0, "speed/wps": 5533.844289553301, "speed/FLOPS": 244567592815478.22, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04658414423465729, "optim/lr": 1.6469766113713424e-05, "optim/total_tokens": 1965937393664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2563691139221191, "created_at": "2025-06-03T07:16:24.835761+00:00"} {"global_step": 234359, "acc_step": 0, "speed/wps": 5520.4106018263055, "speed/FLOPS": 243973892577792.03, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04716537520289421, "optim/lr": 1.6466218888618878e-05, "optim/total_tokens": 1965945782272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.288948655128479, "created_at": "2025-06-03T07:16:27.807351+00:00"} {"global_step": 234360, "acc_step": 0, "speed/wps": 5526.015193815832, "speed/FLOPS": 244221586856826.78, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04717720299959183, "optim/lr": 1.646267166352433e-05, "optim/total_tokens": 1965954170880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2705459594726562, "created_at": "2025-06-03T07:16:30.778279+00:00"} {"global_step": 234361, "acc_step": 0, "speed/wps": 5516.671484219581, "speed/FLOPS": 243808642718113.66, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044457074254751205, "optim/lr": 1.6459124438430005e-05, "optim/total_tokens": 1965962559488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2731306552886963, "created_at": "2025-06-03T07:16:33.752770+00:00"} {"global_step": 234362, "acc_step": 0, "speed/wps": 5519.395649759616, "speed/FLOPS": 243929036891440.0, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04746440425515175, "optim/lr": 1.645557721333546e-05, "optim/total_tokens": 1965970948096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2957446575164795, "created_at": "2025-06-03T07:16:36.724624+00:00"} {"global_step": 234363, "acc_step": 0, "speed/wps": 5531.525782797286, "speed/FLOPS": 244465126684055.75, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04507284238934517, "optim/lr": 1.6452029988240912e-05, "optim/total_tokens": 1965979336704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2557499408721924, "created_at": "2025-06-03T07:16:39.693436+00:00"} {"global_step": 234364, "acc_step": 0, "speed/wps": 5527.863964240274, "speed/FLOPS": 244303293046722.25, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 192.78, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04690169543027878, "optim/lr": 1.6448482763146366e-05, "optim/total_tokens": 1965987725312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2578364610671997, "created_at": "2025-06-03T07:16:42.661949+00:00"} {"global_step": 234365, "acc_step": 0, "speed/wps": 5523.169522556128, "speed/FLOPS": 244095822752613.75, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044877417385578156, "optim/lr": 1.6444935538052043e-05, "optim/total_tokens": 1965996113920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.272045612335205, "created_at": "2025-06-03T07:16:45.635612+00:00"} {"global_step": 234366, "acc_step": 0, "speed/wps": 5514.256862128074, "speed/FLOPS": 243701928780825.34, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04454679414629936, "optim/lr": 1.6441388312957493e-05, "optim/total_tokens": 1966004502528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2616212368011475, "created_at": "2025-06-03T07:16:48.610068+00:00"} {"global_step": 234367, "acc_step": 0, "speed/wps": 5498.069845529133, "speed/FLOPS": 242986545499813.84, "speed/curr_iter_time": 2.9787, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9787, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.83 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.83, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046181827783584595, "optim/lr": 1.6437841087862947e-05, "optim/total_tokens": 1966012891136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2773841619491577, "created_at": "2025-06-03T07:16:51.596201+00:00"} {"global_step": 234368, "acc_step": 0, "speed/wps": 5520.445552487068, "speed/FLOPS": 243975437218104.06, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04779289662837982, "optim/lr": 1.64342938627684e-05, "optim/total_tokens": 1966021279744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2798858880996704, "created_at": "2025-06-03T07:16:54.568073+00:00"} {"global_step": 234369, "acc_step": 0, "speed/wps": 5529.400728246277, "speed/FLOPS": 244371210149916.34, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04550855979323387, "optim/lr": 1.6430746637674078e-05, "optim/total_tokens": 1966029668352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2884483337402344, "created_at": "2025-06-03T07:16:57.534381+00:00"} {"global_step": 234370, "acc_step": 0, "speed/wps": 5527.698179656905, "speed/FLOPS": 244295966216699.78, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047745440155267715, "optim/lr": 1.642719941257953e-05, "optim/total_tokens": 1966038056960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2569606304168701, "created_at": "2025-06-03T07:17:00.501853+00:00"} {"global_step": 234371, "acc_step": 0, "speed/wps": 5506.379982090359, "speed/FLOPS": 243353811000685.22, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04515685886144638, "optim/lr": 1.6423652187484982e-05, "optim/total_tokens": 1966046445568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2620623111724854, "created_at": "2025-06-03T07:17:03.481037+00:00"} {"global_step": 234372, "acc_step": 0, "speed/wps": 5530.5308688141995, "speed/FLOPS": 244421156578434.72, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.049509093165397644, "optim/lr": 1.6420104962390435e-05, "optim/total_tokens": 1966054834176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2654926776885986, "created_at": "2025-06-03T07:17:06.446818+00:00"} {"global_step": 234373, "acc_step": 0, "speed/wps": 5520.872682426798, "speed/FLOPS": 243994314175190.88, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04713967815041542, "optim/lr": 1.6416557737296113e-05, "optim/total_tokens": 1966063222784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2734427452087402, "created_at": "2025-06-03T07:17:09.421904+00:00"} {"global_step": 234374, "acc_step": 0, "speed/wps": 5510.489339451097, "speed/FLOPS": 243535423562432.12, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05086522921919823, "optim/lr": 1.6413010512201566e-05, "optim/total_tokens": 1966071611392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2750657796859741, "created_at": "2025-06-03T07:17:12.399254+00:00"} {"global_step": 234375, "acc_step": 0, "speed/wps": 5522.751436337966, "speed/FLOPS": 244077345481730.25, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04672294110059738, "optim/lr": 1.640946328710702e-05, "optim/total_tokens": 1966080000000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2637754678726196, "created_at": "2025-06-03T07:17:15.369906+00:00"} {"global_step": 234376, "acc_step": 0, "speed/wps": 5513.989995347396, "speed/FLOPS": 243690134635067.34, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.82 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.82, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0516446977853775, "optim/lr": 1.6405916062012694e-05, "optim/total_tokens": 1966088388608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.277881145477295, "created_at": "2025-06-03T07:17:18.344325+00:00"} {"global_step": 234377, "acc_step": 0, "speed/wps": 5530.7231300674675, "speed/FLOPS": 244429653541746.84, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 192.78, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045310262590646744, "optim/lr": 1.6402368836918147e-05, "optim/total_tokens": 1966096777216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2729853391647339, "created_at": "2025-06-03T07:17:21.309823+00:00"} {"global_step": 234378, "acc_step": 0, "speed/wps": 5519.33546345637, "speed/FLOPS": 243926376964897.94, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04697167128324509, "optim/lr": 1.63988216118236e-05, "optim/total_tokens": 1966105165824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2632627487182617, "created_at": "2025-06-03T07:17:24.282374+00:00"} {"global_step": 234379, "acc_step": 0, "speed/wps": 5528.745269168042, "speed/FLOPS": 244342242213602.03, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04515133053064346, "optim/lr": 1.6395274386729054e-05, "optim/total_tokens": 1966113554432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2766722440719604, "created_at": "2025-06-03T07:17:27.248825+00:00"} {"global_step": 234380, "acc_step": 0, "speed/wps": 5526.13389554768, "speed/FLOPS": 244226832865803.94, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04631969705224037, "optim/lr": 1.6391727161634728e-05, "optim/total_tokens": 1966121943040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2698014974594116, "created_at": "2025-06-03T07:17:30.216988+00:00"} {"global_step": 234381, "acc_step": 0, "speed/wps": 5513.418554716014, "speed/FLOPS": 243664879884058.56, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04901239275932312, "optim/lr": 1.6388179936540182e-05, "optim/total_tokens": 1966130331648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2700196504592896, "created_at": "2025-06-03T07:17:33.192152+00:00"} {"global_step": 234382, "acc_step": 0, "speed/wps": 5526.401113638216, "speed/FLOPS": 244238642537659.44, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04900244623422623, "optim/lr": 1.6384632711445635e-05, "optim/total_tokens": 1966138720256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2675608396530151, "created_at": "2025-06-03T07:17:36.163059+00:00"} {"global_step": 234383, "acc_step": 0, "speed/wps": 5509.887785239183, "speed/FLOPS": 243508837945299.12, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05138406902551651, "optim/lr": 1.638108548635109e-05, "optim/total_tokens": 1966147108864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2621910572052002, "created_at": "2025-06-03T07:17:39.139782+00:00"} {"global_step": 234384, "acc_step": 0, "speed/wps": 5523.221840510636, "speed/FLOPS": 244098134938415.44, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045187585055828094, "optim/lr": 1.6377538261256763e-05, "optim/total_tokens": 1966155497472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2786123752593994, "created_at": "2025-06-03T07:17:42.113045+00:00"} {"global_step": 234385, "acc_step": 0, "speed/wps": 5508.105525377358, "speed/FLOPS": 243430071181839.4, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.81 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.81, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05545688048005104, "optim/lr": 1.6373991036162216e-05, "optim/total_tokens": 1966163886080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2850697040557861, "created_at": "2025-06-03T07:17:45.094156+00:00"} {"global_step": 234386, "acc_step": 0, "speed/wps": 5527.515904864996, "speed/FLOPS": 244287910603864.34, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04709809273481369, "optim/lr": 1.637044381106767e-05, "optim/total_tokens": 1966172274688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2844336032867432, "created_at": "2025-06-03T07:17:48.063255+00:00"} {"global_step": 234387, "acc_step": 0, "speed/wps": 5524.529091897237, "speed/FLOPS": 244155908758584.03, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.048220254480838776, "optim/lr": 1.6366896585973124e-05, "optim/total_tokens": 1966180663296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2529493570327759, "created_at": "2025-06-03T07:17:51.032520+00:00"} {"global_step": 234388, "acc_step": 0, "speed/wps": 5537.702154032191, "speed/FLOPS": 244738090679104.72, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 192.45, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04471897333860397, "optim/lr": 1.6363349360878798e-05, "optim/total_tokens": 1966189051904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2661458253860474, "created_at": "2025-06-03T07:17:53.998521+00:00"} {"global_step": 234389, "acc_step": 0, "speed/wps": 5526.4179222325865, "speed/FLOPS": 244239385391496.44, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047857046127319336, "optim/lr": 1.635980213578425e-05, "optim/total_tokens": 1966197440512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2598038911819458, "created_at": "2025-06-03T07:17:56.967086+00:00"} {"global_step": 234390, "acc_step": 0, "speed/wps": 5515.7687493258245, "speed/FLOPS": 243768746456425.7, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0464654266834259, "optim/lr": 1.6356254910689705e-05, "optim/total_tokens": 1966205829120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.257213830947876, "created_at": "2025-06-03T07:17:59.942531+00:00"} {"global_step": 234391, "acc_step": 0, "speed/wps": 5517.296284873803, "speed/FLOPS": 243836255709010.66, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047573961317539215, "optim/lr": 1.635270768559516e-05, "optim/total_tokens": 1966214217728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2748908996582031, "created_at": "2025-06-03T07:18:02.915502+00:00"} {"global_step": 234392, "acc_step": 0, "speed/wps": 5518.109323966731, "speed/FLOPS": 243872187875406.72, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04633577540516853, "optim/lr": 1.6349160460500832e-05, "optim/total_tokens": 1966222606336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2774674892425537, "created_at": "2025-06-03T07:18:05.887981+00:00"} {"global_step": 234393, "acc_step": 0, "speed/wps": 5515.3422600318945, "speed/FLOPS": 243749897812604.1, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.8 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.8, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04558030515909195, "optim/lr": 1.6345613235406286e-05, "optim/total_tokens": 1966230994944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2728490829467773, "created_at": "2025-06-03T07:18:08.862152+00:00"} {"global_step": 234394, "acc_step": 0, "speed/wps": 5535.712532375631, "speed/FLOPS": 244650159585691.56, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045204948633909225, "optim/lr": 1.634206601031174e-05, "optim/total_tokens": 1966239383552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2650563716888428, "created_at": "2025-06-03T07:18:11.829087+00:00"} {"global_step": 234395, "acc_step": 0, "speed/wps": 5530.2652413473115, "speed/FLOPS": 244409417204002.88, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 192.72, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04838190972805023, "optim/lr": 1.6338518785217193e-05, "optim/total_tokens": 1966247772160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2743459939956665, "created_at": "2025-06-03T07:18:14.795423+00:00"} {"global_step": 234396, "acc_step": 0, "speed/wps": 5533.139651332782, "speed/FLOPS": 244536451412796.62, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 192.71, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04554281756281853, "optim/lr": 1.633497156012287e-05, "optim/total_tokens": 1966256160768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2547285556793213, "created_at": "2025-06-03T07:18:17.760144+00:00"} {"global_step": 234397, "acc_step": 0, "speed/wps": 5532.575633219209, "speed/FLOPS": 244511524699083.12, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047643717378377914, "optim/lr": 1.633142433502832e-05, "optim/total_tokens": 1966264549376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2748435735702515, "created_at": "2025-06-03T07:18:20.724811+00:00"} {"global_step": 234398, "acc_step": 0, "speed/wps": 5524.218834661514, "speed/FLOPS": 244142196976805.6, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04564238339662552, "optim/lr": 1.6327877109933774e-05, "optim/total_tokens": 1966272937984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.258074402809143, "created_at": "2025-06-03T07:18:23.695234+00:00"} {"global_step": 234399, "acc_step": 0, "speed/wps": 5523.231513571035, "speed/FLOPS": 244098562438173.88, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 193.06, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045379750430583954, "optim/lr": 1.6324329884839228e-05, "optim/total_tokens": 1966281326592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2659938335418701, "created_at": "2025-06-03T07:18:26.665152+00:00"} {"global_step": 234400, "acc_step": 0, "speed/wps": 5521.861029135625, "speed/FLOPS": 244037994040904.0, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04674570634961128, "optim/lr": 1.6320782659744905e-05, "optim/total_tokens": 1966289715200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2673394680023193, "created_at": "2025-06-03T07:18:29.640606+00:00"} {"global_step": 234401, "acc_step": 0, "speed/wps": 5533.159398992138, "speed/FLOPS": 244537324158262.53, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045752283185720444, "optim/lr": 1.631723543465036e-05, "optim/total_tokens": 1966298103808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2694591283798218, "created_at": "2025-06-03T07:18:32.604719+00:00"} {"global_step": 234402, "acc_step": 0, "speed/wps": 5527.905500961499, "speed/FLOPS": 244305128757196.16, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046115364879369736, "optim/lr": 1.631368820955581e-05, "optim/total_tokens": 1966306492416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2484623193740845, "created_at": "2025-06-03T07:18:35.571684+00:00"} {"global_step": 234403, "acc_step": 0, "speed/wps": 5527.8647306829225, "speed/FLOPS": 244303326919564.3, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046098873019218445, "optim/lr": 1.6310140984461486e-05, "optim/total_tokens": 1966314881024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.262267827987671, "created_at": "2025-06-03T07:18:38.542874+00:00"} {"global_step": 234404, "acc_step": 0, "speed/wps": 5537.15661259012, "speed/FLOPS": 244713980539699.4, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04770483076572418, "optim/lr": 1.630659375936694e-05, "optim/total_tokens": 1966323269632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2687206268310547, "created_at": "2025-06-03T07:18:41.506538+00:00"} {"global_step": 234405, "acc_step": 0, "speed/wps": 5519.452063570333, "speed/FLOPS": 243931530093121.6, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047977514564991, "optim/lr": 1.6303046534272393e-05, "optim/total_tokens": 1966331658240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2754210233688354, "created_at": "2025-06-03T07:18:44.478260+00:00"} {"global_step": 234406, "acc_step": 0, "speed/wps": 5532.899032625467, "speed/FLOPS": 244525817297531.5, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04740852862596512, "optim/lr": 1.6299499309177847e-05, "optim/total_tokens": 1966340046848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2565996646881104, "created_at": "2025-06-03T07:18:47.442408+00:00"} {"global_step": 234407, "acc_step": 0, "speed/wps": 5523.184681933037, "speed/FLOPS": 244096492719480.4, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04881507158279419, "optim/lr": 1.629595208408352e-05, "optim/total_tokens": 1966348435456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2633484601974487, "created_at": "2025-06-03T07:18:50.412422+00:00"} {"global_step": 234408, "acc_step": 0, "speed/wps": 5514.464477994859, "speed/FLOPS": 243711104339462.88, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044880371540784836, "optim/lr": 1.6292404858988974e-05, "optim/total_tokens": 1966356824064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2748136520385742, "created_at": "2025-06-03T07:18:53.392467+00:00"} {"global_step": 234409, "acc_step": 0, "speed/wps": 5516.4844622570345, "speed/FLOPS": 243800377304634.3, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045487526804208755, "optim/lr": 1.6288857633894428e-05, "optim/total_tokens": 1966365212672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2616597414016724, "created_at": "2025-06-03T07:18:56.368690+00:00"} {"global_step": 234410, "acc_step": 0, "speed/wps": 5516.072319782399, "speed/FLOPS": 243782162716791.84, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.79 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.79, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04605385288596153, "optim/lr": 1.628531040879988e-05, "optim/total_tokens": 1966373601280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2595500946044922, "created_at": "2025-06-03T07:18:59.343010+00:00"} {"global_step": 234411, "acc_step": 0, "speed/wps": 5517.350782208058, "speed/FLOPS": 243838664212242.06, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0454820916056633, "optim/lr": 1.6281763183705555e-05, "optim/total_tokens": 1966381989888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.271809697151184, "created_at": "2025-06-03T07:19:02.320052+00:00"} {"global_step": 234412, "acc_step": 0, "speed/wps": 5532.562420561984, "speed/FLOPS": 244510940767262.3, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04571416601538658, "optim/lr": 1.627821595861101e-05, "optim/total_tokens": 1966390378496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2689017057418823, "created_at": "2025-06-03T07:19:05.285263+00:00"} {"global_step": 234413, "acc_step": 0, "speed/wps": 5530.452454336658, "speed/FLOPS": 244417691059889.03, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046416595578193665, "optim/lr": 1.6274668733516462e-05, "optim/total_tokens": 1966398767104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2792714834213257, "created_at": "2025-06-03T07:19:08.251440+00:00"} {"global_step": 234414, "acc_step": 0, "speed/wps": 5519.450201995752, "speed/FLOPS": 243931447821053.53, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04554874822497368, "optim/lr": 1.6271121508421916e-05, "optim/total_tokens": 1966407155712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.270469069480896, "created_at": "2025-06-03T07:19:11.226217+00:00"} {"global_step": 234415, "acc_step": 0, "speed/wps": 5510.577499453971, "speed/FLOPS": 243539319783315.34, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045660726726055145, "optim/lr": 1.626757428332759e-05, "optim/total_tokens": 1966415544320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2818282842636108, "created_at": "2025-06-03T07:19:14.207211+00:00"} {"global_step": 234416, "acc_step": 0, "speed/wps": 5527.498874668022, "speed/FLOPS": 244287157956326.53, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0450817234814167, "optim/lr": 1.6264027058233043e-05, "optim/total_tokens": 1966423932928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.273909091949463, "created_at": "2025-06-03T07:19:17.175133+00:00"} {"global_step": 234417, "acc_step": 0, "speed/wps": 5523.632599761673, "speed/FLOPS": 244116288394854.84, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04616541415452957, "optim/lr": 1.6260479833138497e-05, "optim/total_tokens": 1966432321536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2746528387069702, "created_at": "2025-06-03T07:19:20.149007+00:00"} {"global_step": 234418, "acc_step": 0, "speed/wps": 5512.940811918495, "speed/FLOPS": 243643766097717.53, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.047641631215810776, "optim/lr": 1.625693260804395e-05, "optim/total_tokens": 1966440710144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2507641315460205, "created_at": "2025-06-03T07:19:23.124459+00:00"} {"global_step": 234419, "acc_step": 0, "speed/wps": 5535.326805388026, "speed/FLOPS": 244633112427169.12, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04689669609069824, "optim/lr": 1.6253385382949625e-05, "optim/total_tokens": 1966449098752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.274361252784729, "created_at": "2025-06-03T07:19:26.093581+00:00"} {"global_step": 234420, "acc_step": 0, "speed/wps": 5521.76543213783, "speed/FLOPS": 244033769142911.25, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05083153024315834, "optim/lr": 1.6249838157855078e-05, "optim/total_tokens": 1966457487360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2830185890197754, "created_at": "2025-06-03T07:19:29.065096+00:00"} {"global_step": 234421, "acc_step": 0, "speed/wps": 5524.10516014611, "speed/FLOPS": 244137173145063.66, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04851318895816803, "optim/lr": 1.6246290932760532e-05, "optim/total_tokens": 1966465875968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.269997239112854, "created_at": "2025-06-03T07:19:32.034627+00:00"} {"global_step": 234422, "acc_step": 0, "speed/wps": 5524.98450294777, "speed/FLOPS": 244176035596012.53, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04743616282939911, "optim/lr": 1.6242743707665985e-05, "optim/total_tokens": 1966474264576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2536005973815918, "created_at": "2025-06-03T07:19:35.003809+00:00"} {"global_step": 234423, "acc_step": 0, "speed/wps": 5514.009372803139, "speed/FLOPS": 243690991019428.38, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04881609231233597, "optim/lr": 1.6239196482571663e-05, "optim/total_tokens": 1966482653184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2561240196228027, "created_at": "2025-06-03T07:19:37.982191+00:00"} {"global_step": 234424, "acc_step": 0, "speed/wps": 5511.60787971586, "speed/FLOPS": 243584857316926.56, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04674028605222702, "optim/lr": 1.6235649257477113e-05, "optim/total_tokens": 1966491041792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2813129425048828, "created_at": "2025-06-03T07:19:40.962946+00:00"} {"global_step": 234425, "acc_step": 0, "speed/wps": 5499.2268964668165, "speed/FLOPS": 243037681228935.9, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04757697880268097, "optim/lr": 1.6232102032382566e-05, "optim/total_tokens": 1966499430400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2734638452529907, "created_at": "2025-06-03T07:19:43.946258+00:00"} {"global_step": 234426, "acc_step": 0, "speed/wps": 5508.52238230581, "speed/FLOPS": 243448494124409.78, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.78 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.78, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04809273034334183, "optim/lr": 1.622855480728802e-05, "optim/total_tokens": 1966507819008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2774180173873901, "created_at": "2025-06-03T07:19:46.924406+00:00"} {"global_step": 234427, "acc_step": 0, "speed/wps": 5530.646615350068, "speed/FLOPS": 244426271982875.6, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.049926478415727615, "optim/lr": 1.6225007582193697e-05, "optim/total_tokens": 1966516207616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2718433141708374, "created_at": "2025-06-03T07:19:49.892448+00:00"} {"global_step": 234428, "acc_step": 0, "speed/wps": 5517.758412751452, "speed/FLOPS": 243856679395817.8, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04743831232190132, "optim/lr": 1.622146035709915e-05, "optim/total_tokens": 1966524596224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2695457935333252, "created_at": "2025-06-03T07:19:52.865695+00:00"} {"global_step": 234429, "acc_step": 0, "speed/wps": 5511.88527097174, "speed/FLOPS": 243597116590619.3, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04878680035471916, "optim/lr": 1.62179131320046e-05, "optim/total_tokens": 1966532984832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.262821078300476, "created_at": "2025-06-03T07:19:55.841836+00:00"} {"global_step": 234430, "acc_step": 0, "speed/wps": 5524.689265471958, "speed/FLOPS": 244162987610744.03, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045260198414325714, "optim/lr": 1.6214365906910278e-05, "optim/total_tokens": 1966541373440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2745566368103027, "created_at": "2025-06-03T07:19:58.811394+00:00"} {"global_step": 234431, "acc_step": 0, "speed/wps": 5523.788465519261, "speed/FLOPS": 244123176863546.97, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04761701077222824, "optim/lr": 1.6210818681815732e-05, "optim/total_tokens": 1966549762048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2651524543762207, "created_at": "2025-06-03T07:20:01.781182+00:00"} {"global_step": 234432, "acc_step": 0, "speed/wps": 5526.468176754964, "speed/FLOPS": 244241606384159.53, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04492746293544769, "optim/lr": 1.6207271456721185e-05, "optim/total_tokens": 1966558150656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2732669115066528, "created_at": "2025-06-03T07:20:04.749309+00:00"} {"global_step": 234433, "acc_step": 0, "speed/wps": 5516.056330314696, "speed/FLOPS": 243781456064160.9, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04649772122502327, "optim/lr": 1.620372423162664e-05, "optim/total_tokens": 1966566539264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2812979221343994, "created_at": "2025-06-03T07:20:07.724731+00:00"} {"global_step": 234434, "acc_step": 0, "speed/wps": 5503.107739711437, "speed/FLOPS": 243209194636391.7, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04826227203011513, "optim/lr": 1.6200177006532313e-05, "optim/total_tokens": 1966574927872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2784711122512817, "created_at": "2025-06-03T07:20:10.705601+00:00"} {"global_step": 234435, "acc_step": 0, "speed/wps": 5506.493374249827, "speed/FLOPS": 243358822353740.0, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046966779977083206, "optim/lr": 1.6196629781437767e-05, "optim/total_tokens": 1966583316480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2719091176986694, "created_at": "2025-06-03T07:20:13.685101+00:00"} {"global_step": 234436, "acc_step": 0, "speed/wps": 5529.423250382471, "speed/FLOPS": 244372205513057.4, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04939872771501541, "optim/lr": 1.619308255634322e-05, "optim/total_tokens": 1966591705088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2712531089782715, "created_at": "2025-06-03T07:20:16.651923+00:00"} {"global_step": 234437, "acc_step": 0, "speed/wps": 5530.935378183154, "speed/FLOPS": 244439033822075.84, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.049239758402109146, "optim/lr": 1.6189535331248674e-05, "optim/total_tokens": 1966600093696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2658843994140625, "created_at": "2025-06-03T07:20:19.621251+00:00"} {"global_step": 234438, "acc_step": 0, "speed/wps": 5513.684930276456, "speed/FLOPS": 243676652320396.38, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04911968857049942, "optim/lr": 1.6185988106154348e-05, "optim/total_tokens": 1966608482304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2715882062911987, "created_at": "2025-06-03T07:20:22.602178+00:00"} {"global_step": 234439, "acc_step": 0, "speed/wps": 5524.383477285956, "speed/FLOPS": 244149473338088.6, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.053047873079776764, "optim/lr": 1.61824408810598e-05, "optim/total_tokens": 1966616870912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2720091342926025, "created_at": "2025-06-03T07:20:25.575060+00:00"} {"global_step": 234440, "acc_step": 0, "speed/wps": 5535.990934191974, "speed/FLOPS": 244662463520984.25, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 192.66, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046121709048748016, "optim/lr": 1.6178893655965255e-05, "optim/total_tokens": 1966625259520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.264719009399414, "created_at": "2025-06-03T07:20:28.542116+00:00"} {"global_step": 234441, "acc_step": 0, "speed/wps": 5509.788394386237, "speed/FLOPS": 243504445378327.4, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05377667769789696, "optim/lr": 1.617534643087071e-05, "optim/total_tokens": 1966633648128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2607269287109375, "created_at": "2025-06-03T07:20:31.522702+00:00"} {"global_step": 234442, "acc_step": 0, "speed/wps": 5498.84828381952, "speed/FLOPS": 243020948487840.56, "speed/curr_iter_time": 2.9767, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9767, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.77 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.77, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04581844061613083, "optim/lr": 1.6171799205776382e-05, "optim/total_tokens": 1966642036736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2745013236999512, "created_at": "2025-06-03T07:20:34.509135+00:00"} {"global_step": 234443, "acc_step": 0, "speed/wps": 5520.903556909531, "speed/FLOPS": 243995678669297.78, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04787982255220413, "optim/lr": 1.6168251980681836e-05, "optim/total_tokens": 1966650425344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2716262340545654, "created_at": "2025-06-03T07:20:37.481983+00:00"} {"global_step": 234444, "acc_step": 0, "speed/wps": 5517.592852600798, "speed/FLOPS": 243849362484572.6, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04588455706834793, "optim/lr": 1.616470475558729e-05, "optim/total_tokens": 1966658813952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2729146480560303, "created_at": "2025-06-03T07:20:40.457573+00:00"} {"global_step": 234445, "acc_step": 0, "speed/wps": 5525.710203452468, "speed/FLOPS": 244208107843848.28, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045470017939805984, "optim/lr": 1.6161157530492743e-05, "optim/total_tokens": 1966667202560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2532539367675781, "created_at": "2025-06-03T07:20:43.426767+00:00"} {"global_step": 234446, "acc_step": 0, "speed/wps": 5524.819414153817, "speed/FLOPS": 244168739516320.88, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.044569868594408035, "optim/lr": 1.6157610305398417e-05, "optim/total_tokens": 1966675591168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2630969285964966, "created_at": "2025-06-03T07:20:46.397986+00:00"} {"global_step": 234447, "acc_step": 0, "speed/wps": 5514.998188784825, "speed/FLOPS": 243734691624599.9, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045203469693660736, "optim/lr": 1.615406308030387e-05, "optim/total_tokens": 1966683979776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2751184701919556, "created_at": "2025-06-03T07:20:49.375214+00:00"} {"global_step": 234448, "acc_step": 0, "speed/wps": 5521.154501612496, "speed/FLOPS": 244006769140717.38, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04476429522037506, "optim/lr": 1.6150515855209324e-05, "optim/total_tokens": 1966692368384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2840602397918701, "created_at": "2025-06-03T07:20:52.346736+00:00"} {"global_step": 234449, "acc_step": 0, "speed/wps": 5524.082923289061, "speed/FLOPS": 244136190389800.62, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0460345484316349, "optim/lr": 1.6146968630114778e-05, "optim/total_tokens": 1966700756992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.270723819732666, "created_at": "2025-06-03T07:20:55.319830+00:00"} {"global_step": 234450, "acc_step": 0, "speed/wps": 5512.004861610819, "speed/FLOPS": 243602401884746.22, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046247296035289764, "optim/lr": 1.614342140502045e-05, "optim/total_tokens": 1966709145600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2655256986618042, "created_at": "2025-06-03T07:20:58.299726+00:00"} {"global_step": 234451, "acc_step": 0, "speed/wps": 5510.559282762674, "speed/FLOPS": 243538514698801.5, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0448138490319252, "optim/lr": 1.6139874179925905e-05, "optim/total_tokens": 1966717534208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2681536674499512, "created_at": "2025-06-03T07:21:01.276490+00:00"} {"global_step": 234452, "acc_step": 0, "speed/wps": 5515.978519889313, "speed/FLOPS": 243778017241628.8, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0461517795920372, "optim/lr": 1.613632695483136e-05, "optim/total_tokens": 1966725922816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2572933435440063, "created_at": "2025-06-03T07:21:04.253796+00:00"} {"global_step": 234453, "acc_step": 0, "speed/wps": 5525.859826362314, "speed/FLOPS": 244214720410624.0, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04532179608941078, "optim/lr": 1.6132779729736812e-05, "optim/total_tokens": 1966734311424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.27128267288208, "created_at": "2025-06-03T07:21:07.223403+00:00"} {"global_step": 234454, "acc_step": 0, "speed/wps": 5533.20204778673, "speed/FLOPS": 244539209016687.16, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 192.76, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04790108650922775, "optim/lr": 1.612923250464249e-05, "optim/total_tokens": 1966742700032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2833678722381592, "created_at": "2025-06-03T07:21:10.188481+00:00"} {"global_step": 234455, "acc_step": 0, "speed/wps": 5522.67290639647, "speed/FLOPS": 244073874860268.8, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04567365348339081, "optim/lr": 1.612568527954794e-05, "optim/total_tokens": 1966751088640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2796179056167603, "created_at": "2025-06-03T07:21:13.161484+00:00"} {"global_step": 234456, "acc_step": 0, "speed/wps": 5520.99074099458, "speed/FLOPS": 243999531759608.3, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04510483890771866, "optim/lr": 1.6122138054453393e-05, "optim/total_tokens": 1966759477248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2717105150222778, "created_at": "2025-06-03T07:21:16.132527+00:00"} {"global_step": 234457, "acc_step": 0, "speed/wps": 5501.194687296365, "speed/FLOPS": 243124647511535.44, "speed/curr_iter_time": 2.977, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.977, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.76 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.76, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04533438757061958, "optim/lr": 1.611859082935907e-05, "optim/total_tokens": 1966767865856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2780139446258545, "created_at": "2025-06-03T07:21:19.119355+00:00"} {"global_step": 234458, "acc_step": 0, "speed/wps": 5521.563728601334, "speed/FLOPS": 244024854879010.44, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0449911430478096, "optim/lr": 1.6115043604264524e-05, "optim/total_tokens": 1966776254464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2601516246795654, "created_at": "2025-06-03T07:21:22.093961+00:00"} {"global_step": 234459, "acc_step": 0, "speed/wps": 5508.973544638088, "speed/FLOPS": 243468433190238.3, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.75 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.75, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04672092944383621, "optim/lr": 1.6111496379169978e-05, "optim/total_tokens": 1966784643072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2647286653518677, "created_at": "2025-06-03T07:21:25.071600+00:00"} {"global_step": 234460, "acc_step": 0, "speed/wps": 5520.385708796272, "speed/FLOPS": 243972792433278.66, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04577646404504776, "optim/lr": 1.6107949154075428e-05, "optim/total_tokens": 1966793031680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 357, "loss/out": 1.2764348983764648, "created_at": "2025-06-03T07:21:28.044281+00:00"} {"global_step": 234461, "acc_step": 0, "speed/wps": 5523.674868116253, "speed/FLOPS": 244118156439778.22, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.045257922261953354, "optim/lr": 1.6104401928981105e-05, "optim/total_tokens": 1966801420288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.272991418838501, "created_at": "2025-06-03T07:21:31.019996+00:00"} {"global_step": 234462, "acc_step": 0, "speed/wps": 5521.62551026882, "speed/FLOPS": 244027585312486.06, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04527318477630615, "optim/lr": 1.610085470388656e-05, "optim/total_tokens": 1966809808896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2860424518585205, "created_at": "2025-06-03T07:21:33.991182+00:00"} {"global_step": 234463, "acc_step": 0, "speed/wps": 5523.962149293181, "speed/FLOPS": 244130852797360.1, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04581483080983162, "optim/lr": 1.6097307478792012e-05, "optim/total_tokens": 1966818197504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2830466032028198, "created_at": "2025-06-03T07:21:36.961514+00:00"} {"global_step": 234464, "acc_step": 0, "speed/wps": 5511.666665088069, "speed/FLOPS": 243587455329487.38, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046873610466718674, "optim/lr": 1.6093760253697466e-05, "optim/total_tokens": 1966826586112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2675095796585083, "created_at": "2025-06-03T07:21:39.937806+00:00"} {"global_step": 234465, "acc_step": 0, "speed/wps": 5515.976690923636, "speed/FLOPS": 243777936410707.38, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04582550376653671, "optim/lr": 1.609021302860314e-05, "optim/total_tokens": 1966834974720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2601344585418701, "created_at": "2025-06-03T07:21:42.911955+00:00"} {"global_step": 234466, "acc_step": 0, "speed/wps": 5510.463822520397, "speed/FLOPS": 243534295844702.7, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04529435932636261, "optim/lr": 1.6086665803508594e-05, "optim/total_tokens": 1966843363328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.27399480342865, "created_at": "2025-06-03T07:21:45.888619+00:00"} {"global_step": 234467, "acc_step": 0, "speed/wps": 5511.858024104778, "speed/FLOPS": 243595912418561.72, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046731237322092056, "optim/lr": 1.6083118578414047e-05, "optim/total_tokens": 1966851751936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2648111581802368, "created_at": "2025-06-03T07:21:48.868384+00:00"} {"global_step": 234468, "acc_step": 0, "speed/wps": 5516.466763061952, "speed/FLOPS": 243799595090804.38, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04482872411608696, "optim/lr": 1.60795713533195e-05, "optim/total_tokens": 1966860140544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.281999111175537, "created_at": "2025-06-03T07:21:51.845854+00:00"} {"global_step": 234469, "acc_step": 0, "speed/wps": 5511.55912626242, "speed/FLOPS": 243582702663827.34, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0480387844145298, "optim/lr": 1.6076024128225175e-05, "optim/total_tokens": 1966868529152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.282004952430725, "created_at": "2025-06-03T07:21:54.827685+00:00"} {"global_step": 234470, "acc_step": 0, "speed/wps": 5518.5520352746735, "speed/FLOPS": 243891753449215.88, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0460418276488781, "optim/lr": 1.6072476903130628e-05, "optim/total_tokens": 1966876917760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2633143663406372, "created_at": "2025-06-03T07:21:57.801565+00:00"} {"global_step": 234471, "acc_step": 0, "speed/wps": 5518.465473050098, "speed/FLOPS": 243887927841955.28, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046718284487724304, "optim/lr": 1.6068929678036082e-05, "optim/total_tokens": 1966885306368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.281985878944397, "created_at": "2025-06-03T07:22:00.774251+00:00"} {"global_step": 234472, "acc_step": 0, "speed/wps": 5517.791551154902, "speed/FLOPS": 243858143943632.56, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04670184850692749, "optim/lr": 1.6065382452941535e-05, "optim/total_tokens": 1966893694976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2714455127716064, "created_at": "2025-06-03T07:22:03.750617+00:00"} {"global_step": 234473, "acc_step": 0, "speed/wps": 5545.289676826456, "speed/FLOPS": 245073420350148.97, "speed/curr_iter_time": 2.9536, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9536, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 192.37, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04637527838349342, "optim/lr": 1.606183522784721e-05, "optim/total_tokens": 1966902083584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.261560082435608, "created_at": "2025-06-03T07:22:06.712152+00:00"} {"global_step": 234474, "acc_step": 0, "speed/wps": 5518.079513604929, "speed/FLOPS": 243870870409998.34, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04603102058172226, "optim/lr": 1.6058288002752663e-05, "optim/total_tokens": 1966910472192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2800606489181519, "created_at": "2025-06-03T07:22:09.685054+00:00"} {"global_step": 234475, "acc_step": 0, "speed/wps": 5507.208615871397, "speed/FLOPS": 243390432372474.94, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0455450564622879, "optim/lr": 1.6054740777658116e-05, "optim/total_tokens": 1966918860800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2820558547973633, "created_at": "2025-06-03T07:22:12.663909+00:00"} {"global_step": 234476, "acc_step": 0, "speed/wps": 5505.4166618065265, "speed/FLOPS": 243311237174860.0, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.05060894787311554, "optim/lr": 1.605119355256357e-05, "optim/total_tokens": 1966927249408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2774940729141235, "created_at": "2025-06-03T07:22:15.643626+00:00"} {"global_step": 234477, "acc_step": 0, "speed/wps": 5504.57454611534, "speed/FLOPS": 243274019971648.44, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.74 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.74, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04538217931985855, "optim/lr": 1.6047646327469244e-05, "optim/total_tokens": 1966935638016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2819533348083496, "created_at": "2025-06-03T07:22:18.630641+00:00"} {"global_step": 234478, "acc_step": 0, "speed/wps": 5521.939455393044, "speed/FLOPS": 244041460080059.94, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.046476271003484726, "optim/lr": 1.6044099102374697e-05, "optim/total_tokens": 1966944026624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2544782161712646, "created_at": "2025-06-03T07:22:21.601843+00:00"} {"global_step": 234479, "acc_step": 0, "speed/wps": 5523.66231319494, "speed/FLOPS": 244117601576518.1, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04636511206626892, "optim/lr": 1.604055187728015e-05, "optim/total_tokens": 1966952415232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.278179407119751, "created_at": "2025-06-03T07:22:24.571903+00:00"} {"global_step": 234480, "acc_step": 0, "speed/wps": 5513.002230163425, "speed/FLOPS": 243646480469776.38, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04776358604431152, "optim/lr": 1.6037004652185605e-05, "optim/total_tokens": 1966960803840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2608872652053833, "created_at": "2025-06-03T07:22:27.547612+00:00"} {"global_step": 234481, "acc_step": 0, "speed/wps": 5518.167461849142, "speed/FLOPS": 243874757272232.62, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04563846066594124, "optim/lr": 1.6033457427091282e-05, "optim/total_tokens": 1966969192448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2649061679840088, "created_at": "2025-06-03T07:22:30.522499+00:00"} {"global_step": 234482, "acc_step": 0, "speed/wps": 5519.171299494687, "speed/FLOPS": 243919121758058.88, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04974077641963959, "optim/lr": 1.6029910201996732e-05, "optim/total_tokens": 1966977581056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2666047811508179, "created_at": "2025-06-03T07:22:33.494921+00:00"} {"global_step": 234483, "acc_step": 0, "speed/wps": 5524.955661950989, "speed/FLOPS": 244174760971576.44, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045125823467969894, "optim/lr": 1.6026362976902186e-05, "optim/total_tokens": 1966985969664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.280914068222046, "created_at": "2025-06-03T07:22:36.467470+00:00"} {"global_step": 234484, "acc_step": 0, "speed/wps": 5514.965941451521, "speed/FLOPS": 243733266457524.7, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04810012876987457, "optim/lr": 1.6022815751807863e-05, "optim/total_tokens": 1966994358272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.264528512954712, "created_at": "2025-06-03T07:22:39.442885+00:00"} {"global_step": 234485, "acc_step": 0, "speed/wps": 5513.38939588988, "speed/FLOPS": 243663591213191.84, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04517469182610512, "optim/lr": 1.6019268526713317e-05, "optim/total_tokens": 1967002746880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2682709693908691, "created_at": "2025-06-03T07:22:42.418702+00:00"} {"global_step": 234486, "acc_step": 0, "speed/wps": 5523.432742413326, "speed/FLOPS": 244107455723020.56, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04544807970523834, "optim/lr": 1.601572130161877e-05, "optim/total_tokens": 1967011135488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2769935131072998, "created_at": "2025-06-03T07:22:45.388552+00:00"} {"global_step": 234487, "acc_step": 0, "speed/wps": 5529.040247836106, "speed/FLOPS": 244355278760892.78, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04517337679862976, "optim/lr": 1.601217407652422e-05, "optim/total_tokens": 1967019524096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2751243114471436, "created_at": "2025-06-03T07:22:48.357192+00:00"} {"global_step": 234488, "acc_step": 0, "speed/wps": 5521.411604986011, "speed/FLOPS": 244018131793852.4, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046197809278964996, "optim/lr": 1.6008626851429898e-05, "optim/total_tokens": 1967027912704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2847039699554443, "created_at": "2025-06-03T07:22:51.330034+00:00"} {"global_step": 234489, "acc_step": 0, "speed/wps": 5514.246084896926, "speed/FLOPS": 243701452482371.44, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045234885066747665, "optim/lr": 1.600507962633535e-05, "optim/total_tokens": 1967036301312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.270516276359558, "created_at": "2025-06-03T07:22:54.305793+00:00"} {"global_step": 234490, "acc_step": 0, "speed/wps": 5520.4925862780165, "speed/FLOPS": 243977515870923.2, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04537983238697052, "optim/lr": 1.6001532401240805e-05, "optim/total_tokens": 1967044689920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2597832679748535, "created_at": "2025-06-03T07:22:57.280340+00:00"} {"global_step": 234491, "acc_step": 0, "speed/wps": 5505.308671134951, "speed/FLOPS": 243306464539922.72, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.73 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.73, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04633454978466034, "optim/lr": 1.599798517614626e-05, "optim/total_tokens": 1967053078528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2744706869125366, "created_at": "2025-06-03T07:23:00.259367+00:00"} {"global_step": 234492, "acc_step": 0, "speed/wps": 5508.067458867817, "speed/FLOPS": 243428388836959.72, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.04582114890217781, "optim/lr": 1.5994437951051932e-05, "optim/total_tokens": 1967061467136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2698673009872437, "created_at": "2025-06-03T07:23:03.237827+00:00"} {"global_step": 234493, "acc_step": 0, "speed/wps": 5512.263654224379, "speed/FLOPS": 243613839193644.9, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04572056606411934, "optim/lr": 1.5990890725957386e-05, "optim/total_tokens": 1967069855744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2778843641281128, "created_at": "2025-06-03T07:23:06.213655+00:00"} {"global_step": 234494, "acc_step": 0, "speed/wps": 5506.290269946543, "speed/FLOPS": 243349846183116.94, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.16, "optim/grad_norm": 0.0469428114593029, "optim/lr": 1.598734350086284e-05, "optim/total_tokens": 1967078244352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2627791166305542, "created_at": "2025-06-03T07:23:09.193213+00:00"} {"global_step": 234495, "acc_step": 0, "speed/wps": 5534.024811548544, "speed/FLOPS": 244575570963672.62, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 192.77, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04556262493133545, "optim/lr": 1.5983796275768293e-05, "optim/total_tokens": 1967086632960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2666760683059692, "created_at": "2025-06-03T07:23:12.158216+00:00"} {"global_step": 234496, "acc_step": 0, "speed/wps": 5523.925397902453, "speed/FLOPS": 244129228574000.6, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04692856967449188, "optim/lr": 1.5980249050673967e-05, "optim/total_tokens": 1967095021568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2538607120513916, "created_at": "2025-06-03T07:23:15.132284+00:00"} {"global_step": 234497, "acc_step": 0, "speed/wps": 5519.312690088037, "speed/FLOPS": 243925370498582.28, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04733963683247566, "optim/lr": 1.597670182557942e-05, "optim/total_tokens": 1967103410176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2662229537963867, "created_at": "2025-06-03T07:23:18.104263+00:00"} {"global_step": 234498, "acc_step": 0, "speed/wps": 5511.46564124297, "speed/FLOPS": 243578571104467.34, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04640738666057587, "optim/lr": 1.5973154600484874e-05, "optim/total_tokens": 1967111798784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2650176286697388, "created_at": "2025-06-03T07:23:21.080756+00:00"} {"global_step": 234499, "acc_step": 0, "speed/wps": 5507.041578551731, "speed/FLOPS": 243383050177920.2, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.72 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.72, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.049763236194849014, "optim/lr": 1.5969607375390328e-05, "optim/total_tokens": 1967120187392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2814604043960571, "created_at": "2025-06-03T07:23:24.064861+00:00"} {"global_step": 234500, "acc_step": 0, "speed/wps": 5515.480303889382, "speed/FLOPS": 243755998644532.53, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04595956206321716, "optim/lr": 1.5966060150296e-05, "optim/total_tokens": 1967128576000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.253757357597351, "created_at": "2025-06-03T07:23:27.045334+00:00"} {"global_step": 234501, "acc_step": 0, "speed/wps": 5520.025484405416, "speed/FLOPS": 243956872358998.38, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04835947975516319, "optim/lr": 1.5962512925201455e-05, "optim/total_tokens": 1967136964608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2726500034332275, "created_at": "2025-06-03T07:23:30.020811+00:00"} {"global_step": 234502, "acc_step": 0, "speed/wps": 5536.664412389742, "speed/FLOPS": 244692227810151.72, "speed/curr_iter_time": 2.9564, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9564, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 192.58, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04883456230163574, "optim/lr": 1.595896570010691e-05, "optim/total_tokens": 1967145353216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2560999393463135, "created_at": "2025-06-03T07:23:32.987546+00:00"} {"global_step": 234503, "acc_step": 0, "speed/wps": 5522.053887525666, "speed/FLOPS": 244046517394605.1, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04721580073237419, "optim/lr": 1.5955418475012362e-05, "optim/total_tokens": 1967153741824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2645490169525146, "created_at": "2025-06-03T07:23:35.960831+00:00"} {"global_step": 234504, "acc_step": 0, "speed/wps": 5521.484983317847, "speed/FLOPS": 244021374740535.2, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05042681843042374, "optim/lr": 1.5951871249918036e-05, "optim/total_tokens": 1967162130432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2780091762542725, "created_at": "2025-06-03T07:23:38.932026+00:00"} {"global_step": 234505, "acc_step": 0, "speed/wps": 5517.137275039734, "speed/FLOPS": 243829228288230.9, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04923676699399948, "optim/lr": 1.594832402482349e-05, "optim/total_tokens": 1967170519040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2781237363815308, "created_at": "2025-06-03T07:23:41.905532+00:00"} {"global_step": 234506, "acc_step": 0, "speed/wps": 5514.396629446782, "speed/FLOPS": 243708105780918.22, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.71 hours", "speed/est_time_elapsed_hrs": 193.36, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.71, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04922376573085785, "optim/lr": 1.5944776799728943e-05, "optim/total_tokens": 1967178907648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2679145336151123, "created_at": "2025-06-03T07:23:44.884171+00:00"} {"global_step": 234507, "acc_step": 0, "speed/wps": 5517.834862461067, "speed/FLOPS": 243860058081677.72, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04496780410408974, "optim/lr": 1.5941229574634397e-05, "optim/total_tokens": 1967187296256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2709084749221802, "created_at": "2025-06-03T07:23:47.857149+00:00"} {"global_step": 234508, "acc_step": 0, "speed/wps": 5518.401066416592, "speed/FLOPS": 243885081398417.34, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05129396542906761, "optim/lr": 1.593768234954007e-05, "optim/total_tokens": 1967195684864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2721257209777832, "created_at": "2025-06-03T07:23:50.830323+00:00"} {"global_step": 234509, "acc_step": 0, "speed/wps": 5515.951466886671, "speed/FLOPS": 243776821637381.88, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04715932533144951, "optim/lr": 1.5934135124445524e-05, "optim/total_tokens": 1967204073472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2754905223846436, "created_at": "2025-06-03T07:23:53.804491+00:00"} {"global_step": 234510, "acc_step": 0, "speed/wps": 5514.105452827338, "speed/FLOPS": 243695237264715.84, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045458026230335236, "optim/lr": 1.5930587899350978e-05, "optim/total_tokens": 1967212462080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2831612825393677, "created_at": "2025-06-03T07:23:56.779280+00:00"} {"global_step": 234511, "acc_step": 0, "speed/wps": 5520.340293020152, "speed/FLOPS": 243970785288433.12, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047571536153554916, "optim/lr": 1.5927040674256655e-05, "optim/total_tokens": 1967220850688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2749145030975342, "created_at": "2025-06-03T07:23:59.750793+00:00"} {"global_step": 234512, "acc_step": 0, "speed/wps": 5529.974049665222, "speed/FLOPS": 244396548022108.66, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04496213048696518, "optim/lr": 1.592349344916211e-05, "optim/total_tokens": 1967229239296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2734295129776, "created_at": "2025-06-03T07:24:02.717802+00:00"} {"global_step": 234513, "acc_step": 0, "speed/wps": 5522.469595394235, "speed/FLOPS": 244064889554610.06, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04899187758564949, "optim/lr": 1.591994622406756e-05, "optim/total_tokens": 1967237627904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2778948545455933, "created_at": "2025-06-03T07:24:05.688123+00:00"} {"global_step": 234514, "acc_step": 0, "speed/wps": 5515.479460469027, "speed/FLOPS": 243755961369669.84, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.044785212725400925, "optim/lr": 1.5916398998973013e-05, "optim/total_tokens": 1967246016512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2718764543533325, "created_at": "2025-06-03T07:24:08.662103+00:00"} {"global_step": 234515, "acc_step": 0, "speed/wps": 5513.754869191618, "speed/FLOPS": 243679743262466.75, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.044809505343437195, "optim/lr": 1.591285177387869e-05, "optim/total_tokens": 1967254405120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2490079402923584, "created_at": "2025-06-03T07:24:11.641494+00:00"} {"global_step": 234516, "acc_step": 0, "speed/wps": 5522.348510125335, "speed/FLOPS": 244059538205495.28, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04539894312620163, "optim/lr": 1.5909304548784144e-05, "optim/total_tokens": 1967262793728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2785600423812866, "created_at": "2025-06-03T07:24:14.615971+00:00"} {"global_step": 234517, "acc_step": 0, "speed/wps": 5513.96401305799, "speed/FLOPS": 243688986350865.03, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.7 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.7, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04543633759021759, "optim/lr": 1.5905757323689597e-05, "optim/total_tokens": 1967271182336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2679263353347778, "created_at": "2025-06-03T07:24:17.591242+00:00"} {"global_step": 234518, "acc_step": 0, "speed/wps": 5518.438887701974, "speed/FLOPS": 243886752905644.34, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05272815749049187, "optim/lr": 1.5902210098595047e-05, "optim/total_tokens": 1967279570944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2553478479385376, "created_at": "2025-06-03T07:24:20.568204+00:00"} {"global_step": 234519, "acc_step": 0, "speed/wps": 5517.0838442732465, "speed/FLOPS": 243826866921835.6, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04503995180130005, "optim/lr": 1.5898662873500725e-05, "optim/total_tokens": 1967287959552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.272908091545105, "created_at": "2025-06-03T07:24:23.545346+00:00"} {"global_step": 234520, "acc_step": 0, "speed/wps": 5520.800853236586, "speed/FLOPS": 243991139692638.62, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.050502240657806396, "optim/lr": 1.5895115648406178e-05, "optim/total_tokens": 1967296348160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2709753513336182, "created_at": "2025-06-03T07:24:26.518267+00:00"} {"global_step": 234521, "acc_step": 0, "speed/wps": 5518.37682419522, "speed/FLOPS": 243884010016315.66, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04577628895640373, "optim/lr": 1.5891568423311632e-05, "optim/total_tokens": 1967304736768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.262428879737854, "created_at": "2025-06-03T07:24:29.494290+00:00"} {"global_step": 234522, "acc_step": 0, "speed/wps": 5535.771857450215, "speed/FLOPS": 244652781450334.94, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04631052911281586, "optim/lr": 1.5888021198217085e-05, "optim/total_tokens": 1967313125376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.267787218093872, "created_at": "2025-06-03T07:24:32.458147+00:00"} {"global_step": 234523, "acc_step": 0, "speed/wps": 5521.971324577474, "speed/FLOPS": 244042868534890.47, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04874849319458008, "optim/lr": 1.588447397312276e-05, "optim/total_tokens": 1967321513984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2744580507278442, "created_at": "2025-06-03T07:24:35.432472+00:00"} {"global_step": 234524, "acc_step": 0, "speed/wps": 5517.627942377145, "speed/FLOPS": 243850913273081.34, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047886818647384644, "optim/lr": 1.5880926748028213e-05, "optim/total_tokens": 1967329902592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.277559518814087, "created_at": "2025-06-03T07:24:38.406173+00:00"} {"global_step": 234525, "acc_step": 0, "speed/wps": 5512.257805101115, "speed/FLOPS": 243613580692335.16, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04970024526119232, "optim/lr": 1.5877379522933666e-05, "optim/total_tokens": 1967338291200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2698560953140259, "created_at": "2025-06-03T07:24:41.383393+00:00"} {"global_step": 234526, "acc_step": 0, "speed/wps": 5518.200254223576, "speed/FLOPS": 243876206527336.03, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04581150785088539, "optim/lr": 1.587383229783912e-05, "optim/total_tokens": 1967346679808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.266648769378662, "created_at": "2025-06-03T07:24:44.358157+00:00"} {"global_step": 234527, "acc_step": 0, "speed/wps": 5516.059291768647, "speed/FLOPS": 243781586945267.44, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.06516790390014648, "optim/lr": 1.5870285072744794e-05, "optim/total_tokens": 1967355068416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2783514261245728, "created_at": "2025-06-03T07:24:47.334434+00:00"} {"global_step": 234528, "acc_step": 0, "speed/wps": 5527.6302955573665, "speed/FLOPS": 244292966086962.47, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04444374144077301, "optim/lr": 1.5866737847650248e-05, "optim/total_tokens": 1967363457024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.274253249168396, "created_at": "2025-06-03T07:24:50.302576+00:00"} {"global_step": 234529, "acc_step": 0, "speed/wps": 5526.607307661864, "speed/FLOPS": 244247755258108.0, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 192.94, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05230565369129181, "optim/lr": 1.58631906225557e-05, "optim/total_tokens": 1967371845632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.276465654373169, "created_at": "2025-06-03T07:24:53.271599+00:00"} {"global_step": 234530, "acc_step": 0, "speed/wps": 5512.805332692416, "speed/FLOPS": 243637778609370.4, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04807597026228905, "optim/lr": 1.5859643397461155e-05, "optim/total_tokens": 1967380234240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.268662691116333, "created_at": "2025-06-03T07:24:56.247206+00:00"} {"global_step": 234531, "acc_step": 0, "speed/wps": 5531.528229098897, "speed/FLOPS": 244465234798065.62, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04891841113567352, "optim/lr": 1.585609617236683e-05, "optim/total_tokens": 1967388622848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2696599960327148, "created_at": "2025-06-03T07:24:59.212458+00:00"} {"global_step": 234532, "acc_step": 0, "speed/wps": 5514.942003859497, "speed/FLOPS": 243732208538480.94, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04920458048582077, "optim/lr": 1.5852548947272282e-05, "optim/total_tokens": 1967397011456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2708860635757446, "created_at": "2025-06-03T07:25:02.186606+00:00"} {"global_step": 234533, "acc_step": 0, "speed/wps": 5518.615478571971, "speed/FLOPS": 243894557318224.2, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04631401598453522, "optim/lr": 1.5849001722177736e-05, "optim/total_tokens": 1967405400064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2711522579193115, "created_at": "2025-06-03T07:25:05.163661+00:00"} {"global_step": 234534, "acc_step": 0, "speed/wps": 5519.04830229341, "speed/FLOPS": 243913685911319.2, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04959350824356079, "optim/lr": 1.584545449708319e-05, "optim/total_tokens": 1967413788672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2669572830200195, "created_at": "2025-06-03T07:25:08.136302+00:00"} {"global_step": 234535, "acc_step": 0, "speed/wps": 5518.559446265671, "speed/FLOPS": 243892080977085.1, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04980163648724556, "optim/lr": 1.5841907271988863e-05, "optim/total_tokens": 1967422177280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2573962211608887, "created_at": "2025-06-03T07:25:11.108700+00:00"} {"global_step": 234536, "acc_step": 0, "speed/wps": 5504.314314880397, "speed/FLOPS": 243262519083048.16, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.69 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.69, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046669211238622665, "optim/lr": 1.5838360046894317e-05, "optim/total_tokens": 1967430565888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2511659860610962, "created_at": "2025-06-03T07:25:14.092877+00:00"} {"global_step": 234537, "acc_step": 0, "speed/wps": 5523.855116614564, "speed/FLOPS": 244126122500808.12, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.049306098371744156, "optim/lr": 1.583481282179977e-05, "optim/total_tokens": 1967438954496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2707303762435913, "created_at": "2025-06-03T07:25:17.063264+00:00"} {"global_step": 234538, "acc_step": 0, "speed/wps": 5517.201692838121, "speed/FLOPS": 243832075225199.4, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04671863839030266, "optim/lr": 1.5831265596705448e-05, "optim/total_tokens": 1967447343104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2739293575286865, "created_at": "2025-06-03T07:25:20.039234+00:00"} {"global_step": 234539, "acc_step": 0, "speed/wps": 5523.690494641763, "speed/FLOPS": 244118847052221.94, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0503121018409729, "optim/lr": 1.58277183716109e-05, "optim/total_tokens": 1967455731712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2702292203903198, "created_at": "2025-06-03T07:25:23.008684+00:00"} {"global_step": 234540, "acc_step": 0, "speed/wps": 5521.361597045245, "speed/FLOPS": 244015921698834.34, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.049366921186447144, "optim/lr": 1.582417114651635e-05, "optim/total_tokens": 1967464120320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2864651679992676, "created_at": "2025-06-03T07:25:25.980067+00:00"} {"global_step": 234541, "acc_step": 0, "speed/wps": 5512.84818958063, "speed/FLOPS": 243639672664468.0, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04621676355600357, "optim/lr": 1.5820623921421805e-05, "optim/total_tokens": 1967472508928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2784833908081055, "created_at": "2025-06-03T07:25:28.957031+00:00"} {"global_step": 234542, "acc_step": 0, "speed/wps": 5522.586968558329, "speed/FLOPS": 244070076847692.72, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04905163496732712, "optim/lr": 1.5817076696327482e-05, "optim/total_tokens": 1967480897536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2630300521850586, "created_at": "2025-06-03T07:25:31.929104+00:00"} {"global_step": 234543, "acc_step": 0, "speed/wps": 5512.38051795621, "speed/FLOPS": 243619003972429.0, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.68 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.68, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047797463834285736, "optim/lr": 1.5813529471232936e-05, "optim/total_tokens": 1967489286144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2601937055587769, "created_at": "2025-06-03T07:25:34.908766+00:00"} {"global_step": 234544, "acc_step": 0, "speed/wps": 5524.884604010093, "speed/FLOPS": 244171620574296.34, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05020684376358986, "optim/lr": 1.580998224613839e-05, "optim/total_tokens": 1967497674752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2641874551773071, "created_at": "2025-06-03T07:25:37.879175+00:00"} {"global_step": 234545, "acc_step": 0, "speed/wps": 5530.441919700004, "speed/FLOPS": 244417225482870.12, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05227092280983925, "optim/lr": 1.580643502104384e-05, "optim/total_tokens": 1967506063360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2688555717468262, "created_at": "2025-06-03T07:25:40.849649+00:00"} {"global_step": 234546, "acc_step": 0, "speed/wps": 5520.998541889875, "speed/FLOPS": 243999876519251.75, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047062620520591736, "optim/lr": 1.5802887795949517e-05, "optim/total_tokens": 1967514451968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2576038837432861, "created_at": "2025-06-03T07:25:43.820732+00:00"} {"global_step": 234547, "acc_step": 0, "speed/wps": 5523.437792831998, "speed/FLOPS": 244107678925675.47, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05134465917944908, "optim/lr": 1.579934057085497e-05, "optim/total_tokens": 1967522840576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2631657123565674, "created_at": "2025-06-03T07:25:46.790668+00:00"} {"global_step": 234548, "acc_step": 0, "speed/wps": 5526.206859139335, "speed/FLOPS": 244230057483093.56, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04667568951845169, "optim/lr": 1.5795793345760424e-05, "optim/total_tokens": 1967531229184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2752835750579834, "created_at": "2025-06-03T07:25:49.759411+00:00"} {"global_step": 234549, "acc_step": 0, "speed/wps": 5528.338267419611, "speed/FLOPS": 244324254819545.2, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.048179131001234055, "optim/lr": 1.5792246120665878e-05, "optim/total_tokens": 1967539617792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2834023237228394, "created_at": "2025-06-03T07:25:52.727194+00:00"} {"global_step": 234550, "acc_step": 0, "speed/wps": 5512.915424739742, "speed/FLOPS": 243642644114360.0, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04786190018057823, "optim/lr": 1.578869889557155e-05, "optim/total_tokens": 1967548006400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2757606506347656, "created_at": "2025-06-03T07:25:55.703503+00:00"} {"global_step": 234551, "acc_step": 0, "speed/wps": 5520.176426969218, "speed/FLOPS": 243963543247724.3, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04479646310210228, "optim/lr": 1.5785151670477005e-05, "optim/total_tokens": 1967556395008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2520732879638672, "created_at": "2025-06-03T07:25:58.675278+00:00"} {"global_step": 234552, "acc_step": 0, "speed/wps": 5514.193882834153, "speed/FLOPS": 243699145418391.25, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.052578940987586975, "optim/lr": 1.578160444538246e-05, "optim/total_tokens": 1967564783616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2757272720336914, "created_at": "2025-06-03T07:26:01.653312+00:00"} {"global_step": 234553, "acc_step": 0, "speed/wps": 5510.759393339265, "speed/FLOPS": 243547358562028.06, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046496108174324036, "optim/lr": 1.5778057220287912e-05, "optim/total_tokens": 1967573172224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2546769380569458, "created_at": "2025-06-03T07:26:04.634291+00:00"} {"global_step": 234554, "acc_step": 0, "speed/wps": 5532.120129839263, "speed/FLOPS": 244491393781167.2, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04896622523665428, "optim/lr": 1.5774509995193586e-05, "optim/total_tokens": 1967581560832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.25376558303833, "created_at": "2025-06-03T07:26:07.603005+00:00"} {"global_step": 234555, "acc_step": 0, "speed/wps": 5527.973710569287, "speed/FLOPS": 244308143272731.97, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05284591019153595, "optim/lr": 1.577096277009904e-05, "optim/total_tokens": 1967589949440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2585704326629639, "created_at": "2025-06-03T07:26:10.575927+00:00"} {"global_step": 234556, "acc_step": 0, "speed/wps": 5510.685952839736, "speed/FLOPS": 243544112867851.44, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04933599382638931, "optim/lr": 1.5767415545004493e-05, "optim/total_tokens": 1967598338048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.267661213874817, "created_at": "2025-06-03T07:26:13.553605+00:00"} {"global_step": 234557, "acc_step": 0, "speed/wps": 5513.547387968725, "speed/FLOPS": 243670573654400.03, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.67 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.67, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05539831891655922, "optim/lr": 1.5763868319909947e-05, "optim/total_tokens": 1967606726656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2696329355239868, "created_at": "2025-06-03T07:26:16.528815+00:00"} {"global_step": 234558, "acc_step": 0, "speed/wps": 5519.070783027798, "speed/FLOPS": 243914679444712.28, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04615338146686554, "optim/lr": 1.576032109481562e-05, "optim/total_tokens": 1967615115264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2626632452011108, "created_at": "2025-06-03T07:26:19.502866+00:00"} {"global_step": 234559, "acc_step": 0, "speed/wps": 5517.0245795203455, "speed/FLOPS": 243824247723101.88, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05559496954083443, "optim/lr": 1.5756773869721075e-05, "optim/total_tokens": 1967623503872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.265957236289978, "created_at": "2025-06-03T07:26:22.479770+00:00"} {"global_step": 234560, "acc_step": 0, "speed/wps": 5519.013355038463, "speed/FLOPS": 243912141421526.75, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04460781440138817, "optim/lr": 1.5753226644626528e-05, "optim/total_tokens": 1967631892480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2738975286483765, "created_at": "2025-06-03T07:26:25.452309+00:00"} {"global_step": 234561, "acc_step": 0, "speed/wps": 5523.704351333432, "speed/FLOPS": 244119459447068.75, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04630408063530922, "optim/lr": 1.5749679419531982e-05, "optim/total_tokens": 1967640281088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.279337763786316, "created_at": "2025-06-03T07:26:28.422022+00:00"} {"global_step": 234562, "acc_step": 0, "speed/wps": 5539.169192283403, "speed/FLOPS": 244802926260825.8, "speed/curr_iter_time": 2.9567, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9567, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 192.65, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.050824448466300964, "optim/lr": 1.5746132194437656e-05, "optim/total_tokens": 1967648669696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2684801816940308, "created_at": "2025-06-03T07:26:31.387083+00:00"} {"global_step": 234563, "acc_step": 0, "speed/wps": 5521.671030816041, "speed/FLOPS": 244029597087677.94, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045795198529958725, "optim/lr": 1.574258496934311e-05, "optim/total_tokens": 1967657058304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2782100439071655, "created_at": "2025-06-03T07:26:34.359431+00:00"} {"global_step": 234564, "acc_step": 0, "speed/wps": 5518.0070214904035, "speed/FLOPS": 243867666629584.6, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.66 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.66, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05871687829494476, "optim/lr": 1.5739037744248563e-05, "optim/total_tokens": 1967665446912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2569752931594849, "created_at": "2025-06-03T07:26:37.331783+00:00"} {"global_step": 234565, "acc_step": 0, "speed/wps": 5524.109818469005, "speed/FLOPS": 244137379019092.16, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04657275229692459, "optim/lr": 1.573549051915424e-05, "optim/total_tokens": 1967673835520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2679007053375244, "created_at": "2025-06-03T07:26:40.301024+00:00"} {"global_step": 234566, "acc_step": 0, "speed/wps": 5528.788011535734, "speed/FLOPS": 244344131207478.75, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04961726441979408, "optim/lr": 1.573194329405969e-05, "optim/total_tokens": 1967682224128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2755250930786133, "created_at": "2025-06-03T07:26:43.267816+00:00"} {"global_step": 234567, "acc_step": 0, "speed/wps": 5531.602616659307, "speed/FLOPS": 244468522347485.72, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04863174259662628, "optim/lr": 1.5728396068965144e-05, "optim/total_tokens": 1967690612736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2792651653289795, "created_at": "2025-06-03T07:26:46.233324+00:00"} {"global_step": 234568, "acc_step": 0, "speed/wps": 5525.023707249213, "speed/FLOPS": 244177768225470.5, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04591786488890648, "optim/lr": 1.5724848843870597e-05, "optim/total_tokens": 1967699001344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2786898612976074, "created_at": "2025-06-03T07:26:49.202333+00:00"} {"global_step": 234569, "acc_step": 0, "speed/wps": 5526.640842821157, "speed/FLOPS": 244249237340500.22, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.051956165581941605, "optim/lr": 1.5721301618776275e-05, "optim/total_tokens": 1967707389952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2631436586380005, "created_at": "2025-06-03T07:26:52.172120+00:00"} {"global_step": 234570, "acc_step": 0, "speed/wps": 5533.5557328911955, "speed/FLOPS": 244554840087980.03, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 192.73, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04619169980287552, "optim/lr": 1.5717754393681728e-05, "optim/total_tokens": 1967715778560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2725334167480469, "created_at": "2025-06-03T07:26:55.136651+00:00"} {"global_step": 234571, "acc_step": 0, "speed/wps": 5529.07062811994, "speed/FLOPS": 244356621413937.84, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.050050005316734314, "optim/lr": 1.571420716858718e-05, "optim/total_tokens": 1967724167168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2738745212554932, "created_at": "2025-06-03T07:26:58.103549+00:00"} {"global_step": 234572, "acc_step": 0, "speed/wps": 5526.651115136694, "speed/FLOPS": 244249691324268.5, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.049650244414806366, "optim/lr": 1.5710659943492632e-05, "optim/total_tokens": 1967732555776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.266282558441162, "created_at": "2025-06-03T07:27:01.071544+00:00"} {"global_step": 234573, "acc_step": 0, "speed/wps": 5519.659178077777, "speed/FLOPS": 243940683494242.5, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046163734048604965, "optim/lr": 1.570711271839831e-05, "optim/total_tokens": 1967740944384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.252502202987671, "created_at": "2025-06-03T07:27:04.043856+00:00"} {"global_step": 234574, "acc_step": 0, "speed/wps": 5521.926340286415, "speed/FLOPS": 244040880459476.16, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.052583545446395874, "optim/lr": 1.5703565493303763e-05, "optim/total_tokens": 1967749332992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.276713252067566, "created_at": "2025-06-03T07:27:07.015348+00:00"} {"global_step": 234575, "acc_step": 0, "speed/wps": 5513.595100476139, "speed/FLOPS": 243672682303013.0, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045353252440690994, "optim/lr": 1.5700018268209217e-05, "optim/total_tokens": 1967757721600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2679787874221802, "created_at": "2025-06-03T07:27:09.991082+00:00"} {"global_step": 234576, "acc_step": 0, "speed/wps": 5507.153226131108, "speed/FLOPS": 243387984429464.53, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.048451635986566544, "optim/lr": 1.569647104311467e-05, "optim/total_tokens": 1967766110208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.258901834487915, "created_at": "2025-06-03T07:27:12.969483+00:00"} {"global_step": 234577, "acc_step": 0, "speed/wps": 5503.238738834517, "speed/FLOPS": 243214984127117.53, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04846160486340523, "optim/lr": 1.5692923818020344e-05, "optim/total_tokens": 1967774498816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.272416591644287, "created_at": "2025-06-03T07:27:15.952946+00:00"} {"global_step": 234578, "acc_step": 0, "speed/wps": 5511.016756509382, "speed/FLOPS": 243558732696843.06, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04592563584446907, "optim/lr": 1.5689376592925798e-05, "optim/total_tokens": 1967782887424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2838104963302612, "created_at": "2025-06-03T07:27:18.930009+00:00"} {"global_step": 234579, "acc_step": 0, "speed/wps": 5522.507118378084, "speed/FLOPS": 244066547878436.12, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05194831266999245, "optim/lr": 1.568582936783125e-05, "optim/total_tokens": 1967791276032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.271741271018982, "created_at": "2025-06-03T07:27:21.905646+00:00"} {"global_step": 234580, "acc_step": 0, "speed/wps": 5532.611770757163, "speed/FLOPS": 244513121793292.0, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 192.79, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045548174530267715, "optim/lr": 1.5682282142736705e-05, "optim/total_tokens": 1967799664640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.260072946548462, "created_at": "2025-06-03T07:27:24.871196+00:00"} {"global_step": 234581, "acc_step": 0, "speed/wps": 5519.615922120011, "speed/FLOPS": 243938771802313.3, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046849921345710754, "optim/lr": 1.567873491764238e-05, "optim/total_tokens": 1967808053248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2749515771865845, "created_at": "2025-06-03T07:27:27.843462+00:00"} {"global_step": 234582, "acc_step": 0, "speed/wps": 5529.030151703809, "speed/FLOPS": 244354832563521.94, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.049483105540275574, "optim/lr": 1.5675187692547832e-05, "optim/total_tokens": 1967816441856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2513794898986816, "created_at": "2025-06-03T07:27:30.810614+00:00"} {"global_step": 234583, "acc_step": 0, "speed/wps": 5518.754734609261, "speed/FLOPS": 243900711722295.4, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04507610946893692, "optim/lr": 1.5671640467453286e-05, "optim/total_tokens": 1967824830464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2676806449890137, "created_at": "2025-06-03T07:27:33.783105+00:00"} {"global_step": 234584, "acc_step": 0, "speed/wps": 5521.722775318245, "speed/FLOPS": 244031883929823.0, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05558991804718971, "optim/lr": 1.566809324235874e-05, "optim/total_tokens": 1967833219072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2601203918457031, "created_at": "2025-06-03T07:27:36.753740+00:00"} {"global_step": 234585, "acc_step": 0, "speed/wps": 5509.71570796526, "speed/FLOPS": 243501233010563.03, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.65 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.65, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0489593967795372, "optim/lr": 1.5664546017264413e-05, "optim/total_tokens": 1967841607680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2796207666397095, "created_at": "2025-06-03T07:27:39.730728+00:00"} {"global_step": 234586, "acc_step": 0, "speed/wps": 5515.847060557927, "speed/FLOPS": 243772207412051.4, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.64 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.64, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04844837635755539, "optim/lr": 1.5660998792169867e-05, "optim/total_tokens": 1967849996288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.261284589767456, "created_at": "2025-06-03T07:27:42.708727+00:00"} {"global_step": 234587, "acc_step": 0, "speed/wps": 5524.161852409034, "speed/FLOPS": 244139678652907.56, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.08, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04586544260382652, "optim/lr": 1.565745156707532e-05, "optim/total_tokens": 1967858384896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2589424848556519, "created_at": "2025-06-03T07:27:45.679143+00:00"} {"global_step": 234588, "acc_step": 0, "speed/wps": 5525.568362108381, "speed/FLOPS": 244201839182449.44, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0554635226726532, "optim/lr": 1.5653904341980774e-05, "optim/total_tokens": 1967866773504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.274671196937561, "created_at": "2025-06-03T07:27:48.648302+00:00"} {"global_step": 234589, "acc_step": 0, "speed/wps": 5529.248149906855, "speed/FLOPS": 244364466968280.66, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047584764659404755, "optim/lr": 1.5650357116886448e-05, "optim/total_tokens": 1967875162112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2832762002944946, "created_at": "2025-06-03T07:27:51.615799+00:00"} {"global_step": 234590, "acc_step": 0, "speed/wps": 5522.656873005063, "speed/FLOPS": 244073166266434.97, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05088862031698227, "optim/lr": 1.56468098917919e-05, "optim/total_tokens": 1967883550720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2626577615737915, "created_at": "2025-06-03T07:27:54.586577+00:00"} {"global_step": 234591, "acc_step": 0, "speed/wps": 5529.450454809376, "speed/FLOPS": 244373407809481.72, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04715659096837044, "optim/lr": 1.5643262666697355e-05, "optim/total_tokens": 1967891939328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2606955766677856, "created_at": "2025-06-03T07:27:57.553707+00:00"} {"global_step": 234592, "acc_step": 0, "speed/wps": 5526.786645912112, "speed/FLOPS": 244255681090832.6, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04917634278535843, "optim/lr": 1.5639715441603032e-05, "optim/total_tokens": 1967900327936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2816561460494995, "created_at": "2025-06-03T07:28:00.523259+00:00"} {"global_step": 234593, "acc_step": 0, "speed/wps": 5513.694599338328, "speed/FLOPS": 243677079643440.38, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04550119489431381, "optim/lr": 1.5636168216508483e-05, "optim/total_tokens": 1967908716544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2844208478927612, "created_at": "2025-06-03T07:28:03.499366+00:00"} {"global_step": 234594, "acc_step": 0, "speed/wps": 5517.444465684506, "speed/FLOPS": 243842804542385.56, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.44, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04470552131533623, "optim/lr": 1.5632620991413936e-05, "optim/total_tokens": 1967917105152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2744779586791992, "created_at": "2025-06-03T07:28:06.473115+00:00"} {"global_step": 234595, "acc_step": 0, "speed/wps": 5525.73932872892, "speed/FLOPS": 244209395031990.75, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04830086976289749, "optim/lr": 1.562907376631939e-05, "optim/total_tokens": 1967925493760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2673641443252563, "created_at": "2025-06-03T07:28:09.442261+00:00"} {"global_step": 234596, "acc_step": 0, "speed/wps": 5520.79312523345, "speed/FLOPS": 243990798154455.53, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04597805440425873, "optim/lr": 1.5625526541225067e-05, "optim/total_tokens": 1967933882368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.274765968322754, "created_at": "2025-06-03T07:28:12.414401+00:00"} {"global_step": 234597, "acc_step": 0, "speed/wps": 5525.3121361367885, "speed/FLOPS": 244190515305988.47, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.048046380281448364, "optim/lr": 1.562197931613052e-05, "optim/total_tokens": 1967942270976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2578803300857544, "created_at": "2025-06-03T07:28:15.386333+00:00"} {"global_step": 234598, "acc_step": 0, "speed/wps": 5522.665379896939, "speed/FLOPS": 244073542227513.66, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04751340299844742, "optim/lr": 1.561843209103597e-05, "optim/total_tokens": 1967950659584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2719976902008057, "created_at": "2025-06-03T07:28:18.359404+00:00"} {"global_step": 234599, "acc_step": 0, "speed/wps": 5527.087292763896, "speed/FLOPS": 244268968142831.3, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04830600693821907, "optim/lr": 1.5614884865941424e-05, "optim/total_tokens": 1967959048192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.265310287475586, "created_at": "2025-06-03T07:28:21.327835+00:00"} {"global_step": 234600, "acc_step": 0, "speed/wps": 5511.155525725753, "speed/FLOPS": 243564865585921.47, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047529954463243484, "optim/lr": 1.56113376408471e-05, "optim/total_tokens": 1967967436800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2755427360534668, "created_at": "2025-06-03T07:28:24.304973+00:00"} {"global_step": 234601, "acc_step": 0, "speed/wps": 5514.815595744763, "speed/FLOPS": 243726621946825.1, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045506417751312256, "optim/lr": 1.5607790415752555e-05, "optim/total_tokens": 1967975825408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.265387773513794, "created_at": "2025-06-03T07:28:27.280127+00:00"} {"global_step": 234602, "acc_step": 0, "speed/wps": 5512.964993877182, "speed/FLOPS": 243644834816517.0, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045649852603673935, "optim/lr": 1.560424319065801e-05, "optim/total_tokens": 1967984214016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.284936547279358, "created_at": "2025-06-03T07:28:30.256284+00:00"} {"global_step": 234603, "acc_step": 0, "speed/wps": 5512.927936469304, "speed/FLOPS": 243643197068765.8, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04545414075255394, "optim/lr": 1.560069596556346e-05, "optim/total_tokens": 1967992602624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2676371335983276, "created_at": "2025-06-03T07:28:33.232408+00:00"} {"global_step": 234604, "acc_step": 0, "speed/wps": 5536.570552524644, "speed/FLOPS": 244688079684532.72, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 192.78, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0447501577436924, "optim/lr": 1.5597148740469136e-05, "optim/total_tokens": 1968000991232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2715973854064941, "created_at": "2025-06-03T07:28:36.199914+00:00"} {"global_step": 234605, "acc_step": 0, "speed/wps": 5527.347412870371, "speed/FLOPS": 244280464120122.12, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.051881931722164154, "optim/lr": 1.559360151537459e-05, "optim/total_tokens": 1968009379840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2693452835083008, "created_at": "2025-06-03T07:28:39.173438+00:00"} {"global_step": 234606, "acc_step": 0, "speed/wps": 5524.32066502502, "speed/FLOPS": 244146697357657.5, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046083588153123856, "optim/lr": 1.5590054290280044e-05, "optim/total_tokens": 1968017768448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2669638395309448, "created_at": "2025-06-03T07:28:42.143835+00:00"} {"global_step": 234607, "acc_step": 0, "speed/wps": 5529.764625983606, "speed/FLOPS": 244387292567308.78, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045018959790468216, "optim/lr": 1.5586507065185497e-05, "optim/total_tokens": 1968026157056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2616337537765503, "created_at": "2025-06-03T07:28:45.110968+00:00"} {"global_step": 234608, "acc_step": 0, "speed/wps": 5529.563679405602, "speed/FLOPS": 244378411757098.84, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04709659889340401, "optim/lr": 1.558295984009117e-05, "optim/total_tokens": 1968034545664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2721378803253174, "created_at": "2025-06-03T07:28:48.078120+00:00"} {"global_step": 234609, "acc_step": 0, "speed/wps": 5516.915705650062, "speed/FLOPS": 243819436055302.3, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04536043852567673, "optim/lr": 1.5579412614996625e-05, "optim/total_tokens": 1968042934272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.263780951499939, "created_at": "2025-06-03T07:28:51.056302+00:00"} {"global_step": 234610, "acc_step": 0, "speed/wps": 5514.180414742228, "speed/FLOPS": 243698550197664.12, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05046675726771355, "optim/lr": 1.5575865389902078e-05, "optim/total_tokens": 1968051322880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2672977447509766, "created_at": "2025-06-03T07:28:54.034938+00:00"} {"global_step": 234611, "acc_step": 0, "speed/wps": 5507.4162327943395, "speed/FLOPS": 243399607977789.22, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.63 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.63, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0447869710624218, "optim/lr": 1.5572318164807532e-05, "optim/total_tokens": 1968059711488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2648800611495972, "created_at": "2025-06-03T07:28:57.014543+00:00"} {"global_step": 234612, "acc_step": 0, "speed/wps": 5522.547338981993, "speed/FLOPS": 244068325423261.2, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04800200089812279, "optim/lr": 1.5568770939713206e-05, "optim/total_tokens": 1968068100096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.261084794998169, "created_at": "2025-06-03T07:28:59.984780+00:00"} {"global_step": 234613, "acc_step": 0, "speed/wps": 5518.624609226066, "speed/FLOPS": 243894960846400.28, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04712449386715889, "optim/lr": 1.556522371461866e-05, "optim/total_tokens": 1968076488704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.267087697982788, "created_at": "2025-06-03T07:29:02.957842+00:00"} {"global_step": 234614, "acc_step": 0, "speed/wps": 5525.1366890243025, "speed/FLOPS": 244182761441636.3, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05086943134665489, "optim/lr": 1.5561676489524113e-05, "optim/total_tokens": 1968084877312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2592394351959229, "created_at": "2025-06-03T07:29:05.929843+00:00"} {"global_step": 234615, "acc_step": 0, "speed/wps": 5515.958014788938, "speed/FLOPS": 243777111021146.88, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046301402151584625, "optim/lr": 1.5558129264429566e-05, "optim/total_tokens": 1968093265920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.27297043800354, "created_at": "2025-06-03T07:29:08.904914+00:00"} {"global_step": 234616, "acc_step": 0, "speed/wps": 5514.230681147601, "speed/FLOPS": 243700771715494.8, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.62 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.62, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047962870448827744, "optim/lr": 1.555458203933524e-05, "optim/total_tokens": 1968101654528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2617002725601196, "created_at": "2025-06-03T07:29:11.880258+00:00"} {"global_step": 234617, "acc_step": 0, "speed/wps": 5516.18379937589, "speed/FLOPS": 243787089544219.84, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04556369036436081, "optim/lr": 1.5551034814240694e-05, "optim/total_tokens": 1968110043136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2626005411148071, "created_at": "2025-06-03T07:29:14.855404+00:00"} {"global_step": 234618, "acc_step": 0, "speed/wps": 5529.3419411040395, "speed/FLOPS": 244368612059129.3, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04633896425366402, "optim/lr": 1.5547487589146147e-05, "optim/total_tokens": 1968118431744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.260290503501892, "created_at": "2025-06-03T07:29:17.825604+00:00"} {"global_step": 234619, "acc_step": 0, "speed/wps": 5519.841935693814, "speed/FLOPS": 243948760445433.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04604705795645714, "optim/lr": 1.55439403640516e-05, "optim/total_tokens": 1968126820352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2526535987854004, "created_at": "2025-06-03T07:29:20.799741+00:00"} {"global_step": 234620, "acc_step": 0, "speed/wps": 5516.980912844627, "speed/FLOPS": 243822317879541.44, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04751008003950119, "optim/lr": 1.5540393138957275e-05, "optim/total_tokens": 1968135208960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2591068744659424, "created_at": "2025-06-03T07:29:23.779350+00:00"} {"global_step": 234621, "acc_step": 0, "speed/wps": 5525.263559024534, "speed/FLOPS": 244188368446267.0, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045251987874507904, "optim/lr": 1.553684591386273e-05, "optim/total_tokens": 1968143597568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2568724155426025, "created_at": "2025-06-03T07:29:26.751083+00:00"} {"global_step": 234622, "acc_step": 0, "speed/wps": 5522.700286730884, "speed/FLOPS": 244075084930904.66, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04786936193704605, "optim/lr": 1.5533298688768182e-05, "optim/total_tokens": 1968151986176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2624214887619019, "created_at": "2025-06-03T07:29:29.722071+00:00"} {"global_step": 234623, "acc_step": 0, "speed/wps": 5526.931158307393, "speed/FLOPS": 244262067799022.5, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047195374965667725, "optim/lr": 1.552975146367386e-05, "optim/total_tokens": 1968160374784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2606948614120483, "created_at": "2025-06-03T07:29:32.690256+00:00"} {"global_step": 234624, "acc_step": 0, "speed/wps": 5512.716311073116, "speed/FLOPS": 243633844309451.28, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047066036611795425, "optim/lr": 1.552620423857931e-05, "optim/total_tokens": 1968168763392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2694334983825684, "created_at": "2025-06-03T07:29:35.667803+00:00"} {"global_step": 234625, "acc_step": 0, "speed/wps": 5527.797668841032, "speed/FLOPS": 244300363129406.34, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.09, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04581860825419426, "optim/lr": 1.5522657013484763e-05, "optim/total_tokens": 1968177152000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2582989931106567, "created_at": "2025-06-03T07:29:38.635960+00:00"} {"global_step": 234626, "acc_step": 0, "speed/wps": 5516.4473756824655, "speed/FLOPS": 243798738267864.66, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.61 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.61, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.055413417518138885, "optim/lr": 1.5519109788390217e-05, "optim/total_tokens": 1968185540608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2608352899551392, "created_at": "2025-06-03T07:29:41.612668+00:00"} {"global_step": 234627, "acc_step": 0, "speed/wps": 5515.470459101879, "speed/FLOPS": 243755563555315.06, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04534360021352768, "optim/lr": 1.5515562563295894e-05, "optim/total_tokens": 1968193929216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2612227201461792, "created_at": "2025-06-03T07:29:44.587435+00:00"} {"global_step": 234628, "acc_step": 0, "speed/wps": 5532.935967035262, "speed/FLOPS": 244527449609397.03, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.053393106907606125, "optim/lr": 1.5512015338201348e-05, "optim/total_tokens": 1968202317824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.273905873298645, "created_at": "2025-06-03T07:29:47.553069+00:00"} {"global_step": 234629, "acc_step": 0, "speed/wps": 5532.6892194361235, "speed/FLOPS": 244516544628483.78, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0464264415204525, "optim/lr": 1.5508468113106798e-05, "optim/total_tokens": 1968210706432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2626805305480957, "created_at": "2025-06-03T07:29:50.520712+00:00"} {"global_step": 234630, "acc_step": 0, "speed/wps": 5526.039199857537, "speed/FLOPS": 244222647800996.06, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05062925070524216, "optim/lr": 1.550492088801225e-05, "optim/total_tokens": 1968219095040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.267811894416809, "created_at": "2025-06-03T07:29:53.490126+00:00"} {"global_step": 234631, "acc_step": 0, "speed/wps": 5516.787875353407, "speed/FLOPS": 243813786610484.94, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04910518229007721, "optim/lr": 1.550137366291793e-05, "optim/total_tokens": 1968227483648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2759687900543213, "created_at": "2025-06-03T07:29:56.464386+00:00"} {"global_step": 234632, "acc_step": 0, "speed/wps": 5523.175361045752, "speed/FLOPS": 244096080783971.03, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05030788853764534, "optim/lr": 1.5497826437823382e-05, "optim/total_tokens": 1968235872256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2509220838546753, "created_at": "2025-06-03T07:29:59.434526+00:00"} {"global_step": 234633, "acc_step": 0, "speed/wps": 5535.205735172919, "speed/FLOPS": 244627761743354.94, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04746479168534279, "optim/lr": 1.5494279212728836e-05, "optim/total_tokens": 1968244260864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2782865762710571, "created_at": "2025-06-03T07:30:02.402516+00:00"} {"global_step": 234634, "acc_step": 0, "speed/wps": 5509.1280842997685, "speed/FLOPS": 243475263052278.88, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04521764814853668, "optim/lr": 1.549073198763429e-05, "optim/total_tokens": 1968252649472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.264643669128418, "created_at": "2025-06-03T07:30:05.383058+00:00"} {"global_step": 234635, "acc_step": 0, "speed/wps": 5514.008567422761, "speed/FLOPS": 243690955425738.0, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.059279654175043106, "optim/lr": 1.5487184762539963e-05, "optim/total_tokens": 1968261038080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2805798053741455, "created_at": "2025-06-03T07:30:08.358253+00:00"} {"global_step": 234636, "acc_step": 0, "speed/wps": 5517.880235291364, "speed/FLOPS": 243862063328537.66, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04585793986916542, "optim/lr": 1.5483637537445417e-05, "optim/total_tokens": 1968269426688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.272998332977295, "created_at": "2025-06-03T07:30:11.331341+00:00"} {"global_step": 234637, "acc_step": 0, "speed/wps": 5513.557626356521, "speed/FLOPS": 243671026138735.78, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05011830851435661, "optim/lr": 1.548009031235087e-05, "optim/total_tokens": 1968277815296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2427197694778442, "created_at": "2025-06-03T07:30:14.306450+00:00"} {"global_step": 234638, "acc_step": 0, "speed/wps": 5529.162709384613, "speed/FLOPS": 244360690934521.75, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045584291219711304, "optim/lr": 1.5476543087256324e-05, "optim/total_tokens": 1968286203904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.256636142730713, "created_at": "2025-06-03T07:30:17.277202+00:00"} {"global_step": 234639, "acc_step": 0, "speed/wps": 5518.209018712744, "speed/FLOPS": 243876593872896.53, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04758428409695625, "optim/lr": 1.5472995862161998e-05, "optim/total_tokens": 1968294592512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2790591716766357, "created_at": "2025-06-03T07:30:20.250885+00:00"} {"global_step": 234640, "acc_step": 0, "speed/wps": 5527.05177521469, "speed/FLOPS": 244267398448951.72, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04626920819282532, "optim/lr": 1.546944863706745e-05, "optim/total_tokens": 1968302981120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2750201225280762, "created_at": "2025-06-03T07:30:23.219089+00:00"} {"global_step": 234641, "acc_step": 0, "speed/wps": 5513.61477367484, "speed/FLOPS": 243673551757699.0, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04520628973841667, "optim/lr": 1.5465901411972905e-05, "optim/total_tokens": 1968311369728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.261096715927124, "created_at": "2025-06-03T07:30:26.193119+00:00"} {"global_step": 234642, "acc_step": 0, "speed/wps": 5532.124777334342, "speed/FLOPS": 244491599176661.62, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046493835747241974, "optim/lr": 1.546235418687836e-05, "optim/total_tokens": 1968319758336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2728267908096313, "created_at": "2025-06-03T07:30:29.158666+00:00"} {"global_step": 234643, "acc_step": 0, "speed/wps": 5523.340682820453, "speed/FLOPS": 244103387160219.28, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04805755242705345, "optim/lr": 1.5458806961784033e-05, "optim/total_tokens": 1968328146944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2654684782028198, "created_at": "2025-06-03T07:30:32.128689+00:00"} {"global_step": 234644, "acc_step": 0, "speed/wps": 5510.053414859334, "speed/FLOPS": 243516157926740.53, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.6 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.6, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0488484725356102, "optim/lr": 1.5455259736689486e-05, "optim/total_tokens": 1968336535552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2760504484176636, "created_at": "2025-06-03T07:30:35.109587+00:00"} {"global_step": 234645, "acc_step": 0, "speed/wps": 5532.617424345143, "speed/FLOPS": 244513371652943.06, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 192.95, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04641954228281975, "optim/lr": 1.545171251159494e-05, "optim/total_tokens": 1968344924160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.264028787612915, "created_at": "2025-06-03T07:30:38.074815+00:00"} {"global_step": 234646, "acc_step": 0, "speed/wps": 5525.258326959975, "speed/FLOPS": 244188137215793.66, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.049071792513132095, "optim/lr": 1.5448165286500393e-05, "optim/total_tokens": 1968353312768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2738434076309204, "created_at": "2025-06-03T07:30:41.045607+00:00"} {"global_step": 234647, "acc_step": 0, "speed/wps": 5517.7112022901465, "speed/FLOPS": 243854592935073.16, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04737528786063194, "optim/lr": 1.5444618061406067e-05, "optim/total_tokens": 1968361701376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2627549171447754, "created_at": "2025-06-03T07:30:44.018400+00:00"} {"global_step": 234648, "acc_step": 0, "speed/wps": 5524.421141647883, "speed/FLOPS": 244151137910102.06, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04697519168257713, "optim/lr": 1.544107083631152e-05, "optim/total_tokens": 1968370089984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2660572528839111, "created_at": "2025-06-03T07:30:46.987462+00:00"} {"global_step": 234649, "acc_step": 0, "speed/wps": 5522.612586619523, "speed/FLOPS": 244071209034872.38, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05414680019021034, "optim/lr": 1.5437523611216974e-05, "optim/total_tokens": 1968378478592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2728983163833618, "created_at": "2025-06-03T07:30:49.957772+00:00"} {"global_step": 234650, "acc_step": 0, "speed/wps": 5522.352951829855, "speed/FLOPS": 244059734506100.34, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04897749051451683, "optim/lr": 1.5433976386122652e-05, "optim/total_tokens": 1968386867200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2550055980682373, "created_at": "2025-06-03T07:30:52.929934+00:00"} {"global_step": 234651, "acc_step": 0, "speed/wps": 5516.398566414116, "speed/FLOPS": 243796581148032.1, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05191827937960625, "optim/lr": 1.5430429161028102e-05, "optim/total_tokens": 1968395255808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.26743745803833, "created_at": "2025-06-03T07:30:55.903715+00:00"} {"global_step": 234652, "acc_step": 0, "speed/wps": 5516.560198554267, "speed/FLOPS": 243803724461318.47, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04592743515968323, "optim/lr": 1.5426881935933556e-05, "optim/total_tokens": 1968403644416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2616796493530273, "created_at": "2025-06-03T07:30:58.877523+00:00"} {"global_step": 234653, "acc_step": 0, "speed/wps": 5509.603033308309, "speed/FLOPS": 243496253367446.97, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.59 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.59, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05279173329472542, "optim/lr": 1.542333471083901e-05, "optim/total_tokens": 1968412033024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.261681079864502, "created_at": "2025-06-03T07:31:01.857682+00:00"} {"global_step": 234654, "acc_step": 0, "speed/wps": 5541.811555923185, "speed/FLOPS": 244919705208860.97, "speed/curr_iter_time": 2.9543, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9543, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 192.57, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0453689806163311, "optim/lr": 1.5419787485744686e-05, "optim/total_tokens": 1968420421632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.262688159942627, "created_at": "2025-06-03T07:31:04.817806+00:00"} {"global_step": 234655, "acc_step": 0, "speed/wps": 5523.1470920850925, "speed/FLOPS": 244094831440603.53, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04909973219037056, "optim/lr": 1.541624026065014e-05, "optim/total_tokens": 1968428810240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.275841474533081, "created_at": "2025-06-03T07:31:07.788094+00:00"} {"global_step": 234656, "acc_step": 0, "speed/wps": 5527.672142704426, "speed/FLOPS": 244294815516669.38, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047354571521282196, "optim/lr": 1.541269303555559e-05, "optim/total_tokens": 1968437198848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2615323066711426, "created_at": "2025-06-03T07:31:10.755308+00:00"} {"global_step": 234657, "acc_step": 0, "speed/wps": 5515.625434392276, "speed/FLOPS": 243762412669915.16, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045301806181669235, "optim/lr": 1.5409145810461044e-05, "optim/total_tokens": 1968445587456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.279013991355896, "created_at": "2025-06-03T07:31:13.730475+00:00"} {"global_step": 234658, "acc_step": 0, "speed/wps": 5523.40209109203, "speed/FLOPS": 244106101091506.94, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05049246922135353, "optim/lr": 1.540559858536672e-05, "optim/total_tokens": 1968453976064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2771717309951782, "created_at": "2025-06-03T07:31:16.700156+00:00"} {"global_step": 234659, "acc_step": 0, "speed/wps": 5522.18261894365, "speed/FLOPS": 244052206664372.8, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045566625893116, "optim/lr": 1.5402051360272175e-05, "optim/total_tokens": 1968462364672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2784138917922974, "created_at": "2025-06-03T07:31:19.673915+00:00"} {"global_step": 234660, "acc_step": 0, "speed/wps": 5513.31041274904, "speed/FLOPS": 243660100562639.06, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04742544889450073, "optim/lr": 1.5398504135177628e-05, "optim/total_tokens": 1968470753280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2689121961593628, "created_at": "2025-06-03T07:31:22.654363+00:00"} {"global_step": 234661, "acc_step": 0, "speed/wps": 5512.2732220108655, "speed/FLOPS": 243614262040835.22, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.58 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.58, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0457175150513649, "optim/lr": 1.539495691008308e-05, "optim/total_tokens": 1968479141888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.271074652671814, "created_at": "2025-06-03T07:31:25.630015+00:00"} {"global_step": 234662, "acc_step": 0, "speed/wps": 5523.485609902754, "speed/FLOPS": 244109792195452.9, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04594006389379501, "optim/lr": 1.5391409684988756e-05, "optim/total_tokens": 1968487530496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.274593472480774, "created_at": "2025-06-03T07:31:28.603149+00:00"} {"global_step": 234663, "acc_step": 0, "speed/wps": 5525.897449239087, "speed/FLOPS": 244216383149206.03, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046938635408878326, "optim/lr": 1.538786245989421e-05, "optim/total_tokens": 1968495919104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2619444131851196, "created_at": "2025-06-03T07:31:31.571922+00:00"} {"global_step": 234664, "acc_step": 0, "speed/wps": 5533.81674421104, "speed/FLOPS": 244566375452340.12, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 192.85, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04694440960884094, "optim/lr": 1.5384315234799663e-05, "optim/total_tokens": 1968504307712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2796924114227295, "created_at": "2025-06-03T07:31:34.540782+00:00"} {"global_step": 234665, "acc_step": 0, "speed/wps": 5519.928989693513, "speed/FLOPS": 243952607786637.0, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04576779901981354, "optim/lr": 1.5380768009705116e-05, "optim/total_tokens": 1968512696320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.277351975440979, "created_at": "2025-06-03T07:31:37.515927+00:00"} {"global_step": 234666, "acc_step": 0, "speed/wps": 5519.131516338944, "speed/FLOPS": 243917363546203.66, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05221223831176758, "optim/lr": 1.537722078461079e-05, "optim/total_tokens": 1968521084928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.285951852798462, "created_at": "2025-06-03T07:31:40.491095+00:00"} {"global_step": 234667, "acc_step": 0, "speed/wps": 5521.252856912254, "speed/FLOPS": 244011115941538.62, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04525512456893921, "optim/lr": 1.5373673559516244e-05, "optim/total_tokens": 1968529473536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2786699533462524, "created_at": "2025-06-03T07:31:43.466524+00:00"} {"global_step": 234668, "acc_step": 0, "speed/wps": 5530.24621798958, "speed/FLOPS": 244408576468961.53, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.06, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.051449667662382126, "optim/lr": 1.5370126334421698e-05, "optim/total_tokens": 1968537862144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2668310403823853, "created_at": "2025-06-03T07:31:46.433964+00:00"} {"global_step": 234669, "acc_step": 0, "speed/wps": 5518.495222233268, "speed/FLOPS": 243889242603581.25, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04652893543243408, "optim/lr": 1.536657910932715e-05, "optim/total_tokens": 1968546250752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2685054540634155, "created_at": "2025-06-03T07:31:49.408232+00:00"} {"global_step": 234670, "acc_step": 0, "speed/wps": 5521.559431573731, "speed/FLOPS": 244024664972384.53, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05222228169441223, "optim/lr": 1.5363031884232825e-05, "optim/total_tokens": 1968554639360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2586712837219238, "created_at": "2025-06-03T07:31:52.381221+00:00"} {"global_step": 234671, "acc_step": 0, "speed/wps": 5518.163969776965, "speed/FLOPS": 243874602940516.47, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05138295516371727, "optim/lr": 1.535948465913828e-05, "optim/total_tokens": 1968563027968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.267641544342041, "created_at": "2025-06-03T07:31:55.358351+00:00"} {"global_step": 234672, "acc_step": 0, "speed/wps": 5522.298509047342, "speed/FLOPS": 244057328413776.72, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.051210593432188034, "optim/lr": 1.5355937434043732e-05, "optim/total_tokens": 1968571416576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2670857906341553, "created_at": "2025-06-03T07:31:58.328424+00:00"} {"global_step": 234673, "acc_step": 0, "speed/wps": 5526.73709746914, "speed/FLOPS": 244253491303265.12, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05329781398177147, "optim/lr": 1.5352390208949186e-05, "optim/total_tokens": 1968579805184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2922096252441406, "created_at": "2025-06-03T07:32:01.297769+00:00"} {"global_step": 234674, "acc_step": 0, "speed/wps": 5523.304373661065, "speed/FLOPS": 244101782481221.47, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.048656683415174484, "optim/lr": 1.534884298385486e-05, "optim/total_tokens": 1968588193792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2671234607696533, "created_at": "2025-06-03T07:32:04.267915+00:00"} {"global_step": 234675, "acc_step": 0, "speed/wps": 5516.39187259694, "speed/FLOPS": 243796285315574.97, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0540011040866375, "optim/lr": 1.5345295758760313e-05, "optim/total_tokens": 1968596582400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2623804807662964, "created_at": "2025-06-03T07:32:07.242075+00:00"} {"global_step": 234676, "acc_step": 0, "speed/wps": 5514.96435606533, "speed/FLOPS": 243733196391569.78, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04534447565674782, "optim/lr": 1.5341748533665767e-05, "optim/total_tokens": 1968604971008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2688121795654297, "created_at": "2025-06-03T07:32:10.221024+00:00"} {"global_step": 234677, "acc_step": 0, "speed/wps": 5508.75931092985, "speed/FLOPS": 243458965156881.7, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05668458715081215, "optim/lr": 1.533820130857144e-05, "optim/total_tokens": 1968613359616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2628374099731445, "created_at": "2025-06-03T07:32:13.202411+00:00"} {"global_step": 234678, "acc_step": 0, "speed/wps": 5514.3972940655285, "speed/FLOPS": 243708135153665.0, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0016, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04789803549647331, "optim/lr": 1.5334654083476894e-05, "optim/total_tokens": 1968621748224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2712079286575317, "created_at": "2025-06-03T07:32:16.180057+00:00"} {"global_step": 234679, "acc_step": 0, "speed/wps": 5513.106065362151, "speed/FLOPS": 243651069454083.3, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.57 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.57, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04797161743044853, "optim/lr": 1.5331106858382348e-05, "optim/total_tokens": 1968630136832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.252375602722168, "created_at": "2025-06-03T07:32:19.156938+00:00"} {"global_step": 234680, "acc_step": 0, "speed/wps": 5533.487726167726, "speed/FLOPS": 244551834538892.66, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.001, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05659865960478783, "optim/lr": 1.53275596332878e-05, "optim/total_tokens": 1968638525440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2594654560089111, "created_at": "2025-06-03T07:32:22.125270+00:00"} {"global_step": 234681, "acc_step": 0, "speed/wps": 5537.6900608269, "speed/FLOPS": 244737556221329.47, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 192.7, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04522065073251724, "optim/lr": 1.532401240819348e-05, "optim/total_tokens": 1968646914048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2582298517227173, "created_at": "2025-06-03T07:32:25.088230+00:00"} {"global_step": 234682, "acc_step": 0, "speed/wps": 5537.812194168229, "speed/FLOPS": 244742953889881.12, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0533180832862854, "optim/lr": 1.532046518309893e-05, "optim/total_tokens": 1968655302656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2605348825454712, "created_at": "2025-06-03T07:32:28.051313+00:00"} {"global_step": 234683, "acc_step": 0, "speed/wps": 5527.801395445319, "speed/FLOPS": 244300527826241.38, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04871711879968643, "optim/lr": 1.5316917958004383e-05, "optim/total_tokens": 1968663691264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.270190954208374, "created_at": "2025-06-03T07:32:31.022389+00:00"} {"global_step": 234684, "acc_step": 0, "speed/wps": 5512.849734448453, "speed/FLOPS": 243639740939718.44, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04967864602804184, "optim/lr": 1.5313370732909836e-05, "optim/total_tokens": 1968672079872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2828292846679688, "created_at": "2025-06-03T07:32:33.998660+00:00"} {"global_step": 234685, "acc_step": 0, "speed/wps": 5516.8862278171255, "speed/FLOPS": 243818133285967.78, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0539107471704483, "optim/lr": 1.5309823507815513e-05, "optim/total_tokens": 1968680468480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.264515995979309, "created_at": "2025-06-03T07:32:36.972849+00:00"} {"global_step": 234686, "acc_step": 0, "speed/wps": 5515.967266364883, "speed/FLOPS": 243777519893449.75, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04851885512471199, "optim/lr": 1.5306276282720967e-05, "optim/total_tokens": 1968688857088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2811219692230225, "created_at": "2025-06-03T07:32:39.952957+00:00"} {"global_step": 234687, "acc_step": 0, "speed/wps": 5517.259631210585, "speed/FLOPS": 243834635804706.88, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04795442521572113, "optim/lr": 1.530272905762642e-05, "optim/total_tokens": 1968697245696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2740567922592163, "created_at": "2025-06-03T07:32:42.927614+00:00"} {"global_step": 234688, "acc_step": 0, "speed/wps": 5523.405018384957, "speed/FLOPS": 244106230462871.06, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.052495602518320084, "optim/lr": 1.529918183253187e-05, "optim/total_tokens": 1968705634304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2709308862686157, "created_at": "2025-06-03T07:32:45.901351+00:00"} {"global_step": 234689, "acc_step": 0, "speed/wps": 5535.606244869457, "speed/FLOPS": 244645462221947.47, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045291170477867126, "optim/lr": 1.5295634607437548e-05, "optim/total_tokens": 1968714022912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2829360961914062, "created_at": "2025-06-03T07:32:48.866039+00:00"} {"global_step": 234690, "acc_step": 0, "speed/wps": 5527.725721003936, "speed/FLOPS": 244297183403269.16, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.049616411328315735, "optim/lr": 1.5292087382343e-05, "optim/total_tokens": 1968722411520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2704905271530151, "created_at": "2025-06-03T07:32:51.837029+00:00"} {"global_step": 234691, "acc_step": 0, "speed/wps": 5522.756023027157, "speed/FLOPS": 244077548189915.72, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045279573649168015, "optim/lr": 1.5288540157248455e-05, "optim/total_tokens": 1968730800128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2838292121887207, "created_at": "2025-06-03T07:32:54.812989+00:00"} {"global_step": 234692, "acc_step": 0, "speed/wps": 5521.790715009392, "speed/FLOPS": 244034886516424.84, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04880484566092491, "optim/lr": 1.528499293215391e-05, "optim/total_tokens": 1968739188736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2629860639572144, "created_at": "2025-06-03T07:32:57.785043+00:00"} {"global_step": 234693, "acc_step": 0, "speed/wps": 5513.640676638706, "speed/FLOPS": 243674696536118.5, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04727151244878769, "optim/lr": 1.5281445707059583e-05, "optim/total_tokens": 1968747577344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.267990231513977, "created_at": "2025-06-03T07:33:00.760724+00:00"} {"global_step": 234694, "acc_step": 0, "speed/wps": 5505.028489635498, "speed/FLOPS": 243294081951745.84, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0014, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.56 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.56, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04583344981074333, "optim/lr": 1.5277898481965036e-05, "optim/total_tokens": 1968755965952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2731528282165527, "created_at": "2025-06-03T07:33:03.740280+00:00"} {"global_step": 234695, "acc_step": 0, "speed/wps": 5530.61995206248, "speed/FLOPS": 244425093602039.28, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.05, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.050846267491579056, "optim/lr": 1.527435125687049e-05, "optim/total_tokens": 1968764354560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.270156979560852, "created_at": "2025-06-03T07:33:06.707958+00:00"} {"global_step": 234696, "acc_step": 0, "speed/wps": 5527.764346743255, "speed/FLOPS": 244298890463242.6, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04517871513962746, "optim/lr": 1.5270804031775943e-05, "optim/total_tokens": 1968772743168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2638850212097168, "created_at": "2025-06-03T07:33:09.676189+00:00"} {"global_step": 234697, "acc_step": 0, "speed/wps": 5535.986324622027, "speed/FLOPS": 244662259801586.5, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04627028852701187, "optim/lr": 1.5267256806681617e-05, "optim/total_tokens": 1968781131776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2692723274230957, "created_at": "2025-06-03T07:33:12.643189+00:00"} {"global_step": 234698, "acc_step": 0, "speed/wps": 5515.283941754684, "speed/FLOPS": 243747320443251.38, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046864770352840424, "optim/lr": 1.526370958158707e-05, "optim/total_tokens": 1968789520384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2605782747268677, "created_at": "2025-06-03T07:33:15.621533+00:00"} {"global_step": 234699, "acc_step": 0, "speed/wps": 5514.269062777185, "speed/FLOPS": 243702467987067.47, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0463278666138649, "optim/lr": 1.5260162356492525e-05, "optim/total_tokens": 1968797908992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2727391719818115, "created_at": "2025-06-03T07:33:18.597064+00:00"} {"global_step": 234700, "acc_step": 0, "speed/wps": 5516.326614028128, "speed/FLOPS": 243793401220857.1, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.55 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.55, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04947695881128311, "optim/lr": 1.5256615131397978e-05, "optim/total_tokens": 1968806297600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.268558144569397, "created_at": "2025-06-03T07:33:21.571534+00:00"} {"global_step": 234701, "acc_step": 0, "speed/wps": 5523.093058902649, "speed/FLOPS": 244092443450506.47, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04582148790359497, "optim/lr": 1.5253067906303652e-05, "optim/total_tokens": 1968814686208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2671527862548828, "created_at": "2025-06-03T07:33:24.542742+00:00"} {"global_step": 234702, "acc_step": 0, "speed/wps": 5518.4874859693255, "speed/FLOPS": 243888900700312.8, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04523690789937973, "optim/lr": 1.5249520681209106e-05, "optim/total_tokens": 1968823074816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.276050090789795, "created_at": "2025-06-03T07:33:27.515878+00:00"} {"global_step": 234703, "acc_step": 0, "speed/wps": 5523.80852112394, "speed/FLOPS": 244124063218619.9, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04912634566426277, "optim/lr": 1.524597345611456e-05, "optim/total_tokens": 1968831463424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2801551818847656, "created_at": "2025-06-03T07:33:30.485949+00:00"} {"global_step": 234704, "acc_step": 0, "speed/wps": 5525.291173730423, "speed/FLOPS": 244189588874922.44, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04659604653716087, "optim/lr": 1.5242426231020235e-05, "optim/total_tokens": 1968839852032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2627654075622559, "created_at": "2025-06-03T07:33:33.455351+00:00"} {"global_step": 234705, "acc_step": 0, "speed/wps": 5533.909991106091, "speed/FLOPS": 244570496487820.5, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0466298945248127, "optim/lr": 1.5238879005925688e-05, "optim/total_tokens": 1968848240640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2727607488632202, "created_at": "2025-06-03T07:33:36.420357+00:00"} {"global_step": 234706, "acc_step": 0, "speed/wps": 5523.9743890245745, "speed/FLOPS": 244131393730839.06, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045812927186489105, "optim/lr": 1.523533178083114e-05, "optim/total_tokens": 1968856629248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2767621278762817, "created_at": "2025-06-03T07:33:39.390455+00:00"} {"global_step": 234707, "acc_step": 0, "speed/wps": 5523.92561211395, "speed/FLOPS": 244129238041052.28, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05898280069231987, "optim/lr": 1.5231784555736594e-05, "optim/total_tokens": 1968865017856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2704648971557617, "created_at": "2025-06-03T07:33:42.366250+00:00"} {"global_step": 234708, "acc_step": 0, "speed/wps": 5520.2456247279315, "speed/FLOPS": 243966601434473.25, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04599255323410034, "optim/lr": 1.522823733064227e-05, "optim/total_tokens": 1968873406464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2727770805358887, "created_at": "2025-06-03T07:33:45.343264+00:00"} {"global_step": 234709, "acc_step": 0, "speed/wps": 5511.072155799886, "speed/FLOPS": 243561181061924.1, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04747270420193672, "optim/lr": 1.5224690105547723e-05, "optim/total_tokens": 1968881795072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2815749645233154, "created_at": "2025-06-03T07:33:48.324823+00:00"} {"global_step": 234710, "acc_step": 0, "speed/wps": 5527.985609816436, "speed/FLOPS": 244308669158550.12, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05092743784189224, "optim/lr": 1.5221142880453177e-05, "optim/total_tokens": 1968890183680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2630542516708374, "created_at": "2025-06-03T07:33:51.296513+00:00"} {"global_step": 234711, "acc_step": 0, "speed/wps": 5513.368590808232, "speed/FLOPS": 243662671735073.06, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.54 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.54, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0450054369866848, "optim/lr": 1.5217595655358628e-05, "optim/total_tokens": 1968898572288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2771841287612915, "created_at": "2025-06-03T07:33:54.274021+00:00"} {"global_step": 234712, "acc_step": 0, "speed/wps": 5528.60555670789, "speed/FLOPS": 244336067637976.53, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046747591346502304, "optim/lr": 1.5214048430264304e-05, "optim/total_tokens": 1968906960896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2511011362075806, "created_at": "2025-06-03T07:33:57.241984+00:00"} {"global_step": 234713, "acc_step": 0, "speed/wps": 5527.0659734972005, "speed/FLOPS": 244268025940365.28, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0460643395781517, "optim/lr": 1.5210501205169758e-05, "optim/total_tokens": 1968915349504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2649834156036377, "created_at": "2025-06-03T07:34:00.210862+00:00"} {"global_step": 234714, "acc_step": 0, "speed/wps": 5536.246285609494, "speed/FLOPS": 244673748746631.62, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.047611091285943985, "optim/lr": 1.5206953980075211e-05, "optim/total_tokens": 1968923738112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2834171056747437, "created_at": "2025-06-03T07:34:03.174643+00:00"} {"global_step": 234715, "acc_step": 0, "speed/wps": 5524.138936851208, "speed/FLOPS": 244138665902544.12, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05237045884132385, "optim/lr": 1.5203406754980665e-05, "optim/total_tokens": 1968932126720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2498193979263306, "created_at": "2025-06-03T07:34:06.144784+00:00"} {"global_step": 234716, "acc_step": 0, "speed/wps": 5526.576607641827, "speed/FLOPS": 244246398474359.28, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046291451901197433, "optim/lr": 1.519985952988634e-05, "optim/total_tokens": 1968940515328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.258381962776184, "created_at": "2025-06-03T07:34:09.113549+00:00"} {"global_step": 234717, "acc_step": 0, "speed/wps": 5523.690570953536, "speed/FLOPS": 244118850424811.72, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04745710641145706, "optim/lr": 1.5196312304791792e-05, "optim/total_tokens": 1968948903936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.286528468132019, "created_at": "2025-06-03T07:34:12.084096+00:00"} {"global_step": 234718, "acc_step": 0, "speed/wps": 5519.107649924031, "speed/FLOPS": 243916308772823.9, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04546457156538963, "optim/lr": 1.5192765079697246e-05, "optim/total_tokens": 1968957292544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2654815912246704, "created_at": "2025-06-03T07:34:15.056870+00:00"} {"global_step": 234719, "acc_step": 0, "speed/wps": 5514.686246407036, "speed/FLOPS": 243720905368167.47, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.052416395395994186, "optim/lr": 1.51892178546027e-05, "optim/total_tokens": 1968965681152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2774559259414673, "created_at": "2025-06-03T07:34:18.033019+00:00"} {"global_step": 234720, "acc_step": 0, "speed/wps": 5516.946927764751, "speed/FLOPS": 243820815912962.34, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04613985866308212, "optim/lr": 1.5185670629508375e-05, "optim/total_tokens": 1968974069760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2586236000061035, "created_at": "2025-06-03T07:34:21.010396+00:00"} {"global_step": 234721, "acc_step": 0, "speed/wps": 5511.19864054766, "speed/FLOPS": 243566771040368.1, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.53 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.53, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05392155796289444, "optim/lr": 1.5182123404413829e-05, "optim/total_tokens": 1968982458368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2697534561157227, "created_at": "2025-06-03T07:34:23.987699+00:00"} {"global_step": 234722, "acc_step": 0, "speed/wps": 5533.782285937958, "speed/FLOPS": 244564852573043.3, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 192.99, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04556158930063248, "optim/lr": 1.517857617931928e-05, "optim/total_tokens": 1968990846976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2667624950408936, "created_at": "2025-06-03T07:34:26.953272+00:00"} {"global_step": 234723, "acc_step": 0, "speed/wps": 5532.891824080164, "speed/FLOPS": 244525498716725.8, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.01, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05662589147686958, "optim/lr": 1.5175028954224734e-05, "optim/total_tokens": 1968999235584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2749537229537964, "created_at": "2025-06-03T07:34:29.918623+00:00"} {"global_step": 234724, "acc_step": 0, "speed/wps": 5525.5216196952615, "speed/FLOPS": 244199773407038.94, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04516689106822014, "optim/lr": 1.517148172913041e-05, "optim/total_tokens": 1969007624192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.270337462425232, "created_at": "2025-06-03T07:34:32.888543+00:00"} {"global_step": 234725, "acc_step": 0, "speed/wps": 5523.08571202515, "speed/FLOPS": 244092118756125.72, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05036969855427742, "optim/lr": 1.5167934504035863e-05, "optim/total_tokens": 1969016012800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2776246070861816, "created_at": "2025-06-03T07:34:35.859345+00:00"} {"global_step": 234726, "acc_step": 0, "speed/wps": 5530.006007747472, "speed/FLOPS": 244397960405767.8, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05028466135263443, "optim/lr": 1.5164387278941317e-05, "optim/total_tokens": 1969024401408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2701913118362427, "created_at": "2025-06-03T07:34:38.826888+00:00"} {"global_step": 234727, "acc_step": 0, "speed/wps": 5530.276202981006, "speed/FLOPS": 244409901652105.44, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.050889816135168076, "optim/lr": 1.5160840053846769e-05, "optim/total_tokens": 1969032790016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2916096448898315, "created_at": "2025-06-03T07:34:41.794000+00:00"} {"global_step": 234728, "acc_step": 0, "speed/wps": 5521.086657281481, "speed/FLOPS": 244003770768545.28, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04617524892091751, "optim/lr": 1.5157292828752444e-05, "optim/total_tokens": 1969041178624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2620967626571655, "created_at": "2025-06-03T07:34:44.768584+00:00"} {"global_step": 234729, "acc_step": 0, "speed/wps": 5516.53413495171, "speed/FLOPS": 243802572583491.06, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04506848379969597, "optim/lr": 1.5153745603657898e-05, "optim/total_tokens": 1969049567232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2554335594177246, "created_at": "2025-06-03T07:34:47.745703+00:00"} {"global_step": 234730, "acc_step": 0, "speed/wps": 5515.996340477706, "speed/FLOPS": 243778804820421.75, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045924510806798935, "optim/lr": 1.5150198378563352e-05, "optim/total_tokens": 1969057955840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.28010892868042, "created_at": "2025-06-03T07:34:50.723914+00:00"} {"global_step": 234731, "acc_step": 0, "speed/wps": 5527.395591591565, "speed/FLOPS": 244282593372997.84, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045274898409843445, "optim/lr": 1.5146651153469027e-05, "optim/total_tokens": 1969066344448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2695655822753906, "created_at": "2025-06-03T07:34:53.692366+00:00"} {"global_step": 234732, "acc_step": 0, "speed/wps": 5523.508062633685, "speed/FLOPS": 244110784491236.56, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04850494861602783, "optim/lr": 1.514310392837448e-05, "optim/total_tokens": 1969074733056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2702174186706543, "created_at": "2025-06-03T07:34:56.666745+00:00"} {"global_step": 234733, "acc_step": 0, "speed/wps": 5532.917775366199, "speed/FLOPS": 244526645630737.8, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04534537345170975, "optim/lr": 1.5139556703279933e-05, "optim/total_tokens": 1969083121664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2653642892837524, "created_at": "2025-06-03T07:34:59.632142+00:00"} {"global_step": 234734, "acc_step": 0, "speed/wps": 5530.47008865281, "speed/FLOPS": 244418470406402.34, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045934926718473434, "optim/lr": 1.5136009478185386e-05, "optim/total_tokens": 1969091510272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2577037811279297, "created_at": "2025-06-03T07:35:02.604211+00:00"} {"global_step": 234735, "acc_step": 0, "speed/wps": 5518.738005924213, "speed/FLOPS": 243899972400041.47, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04746335744857788, "optim/lr": 1.5132462253091062e-05, "optim/total_tokens": 1969099898880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2707958221435547, "created_at": "2025-06-03T07:35:05.577481+00:00"} {"global_step": 234736, "acc_step": 0, "speed/wps": 5519.265101948033, "speed/FLOPS": 243923267346372.28, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.52 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.52, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04648495465517044, "optim/lr": 1.5128915027996515e-05, "optim/total_tokens": 1969108287488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2572919130325317, "created_at": "2025-06-03T07:35:08.552542+00:00"} {"global_step": 234737, "acc_step": 0, "speed/wps": 5524.339483702801, "speed/FLOPS": 244147529046892.7, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04605992138385773, "optim/lr": 1.5125367802901969e-05, "optim/total_tokens": 1969116676096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.258154273033142, "created_at": "2025-06-03T07:35:11.522950+00:00"} {"global_step": 234738, "acc_step": 0, "speed/wps": 5528.360717490296, "speed/FLOPS": 244325246997759.62, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04674571380019188, "optim/lr": 1.512182057780742e-05, "optim/total_tokens": 1969125064704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2753443717956543, "created_at": "2025-06-03T07:35:14.495192+00:00"} {"global_step": 234739, "acc_step": 0, "speed/wps": 5527.113392799114, "speed/FLOPS": 244270121630795.88, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046220578253269196, "optim/lr": 1.5118273352713096e-05, "optim/total_tokens": 1969133453312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2844942808151245, "created_at": "2025-06-03T07:35:17.463577+00:00"} {"global_step": 234740, "acc_step": 0, "speed/wps": 5522.5201300592225, "speed/FLOPS": 244067122928142.66, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0454741008579731, "optim/lr": 1.511472612761855e-05, "optim/total_tokens": 1969141841920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2718822956085205, "created_at": "2025-06-03T07:35:20.435191+00:00"} {"global_step": 234741, "acc_step": 0, "speed/wps": 5537.6028557814725, "speed/FLOPS": 244733702204677.47, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04605834558606148, "optim/lr": 1.5111178902524004e-05, "optim/total_tokens": 1969150230528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2592599391937256, "created_at": "2025-06-03T07:35:23.401765+00:00"} {"global_step": 234742, "acc_step": 0, "speed/wps": 5525.634506419166, "speed/FLOPS": 244204762422428.9, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04531603306531906, "optim/lr": 1.5107631677429457e-05, "optim/total_tokens": 1969158619136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2653238773345947, "created_at": "2025-06-03T07:35:26.372356+00:00"} {"global_step": 234743, "acc_step": 0, "speed/wps": 5517.024807903453, "speed/FLOPS": 243824257816466.25, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0457361564040184, "optim/lr": 1.5104084452335131e-05, "optim/total_tokens": 1969167007744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2669545412063599, "created_at": "2025-06-03T07:35:29.348196+00:00"} {"global_step": 234744, "acc_step": 0, "speed/wps": 5524.667005694924, "speed/FLOPS": 244162003842535.0, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04846978560090065, "optim/lr": 1.5100537227240585e-05, "optim/total_tokens": 1969175396352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2501353025436401, "created_at": "2025-06-03T07:35:32.318213+00:00"} {"global_step": 234745, "acc_step": 0, "speed/wps": 5516.730966717969, "speed/FLOPS": 243811271540083.4, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.51 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.51, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04957157000899315, "optim/lr": 1.5096990002146038e-05, "optim/total_tokens": 1969183784960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2712074518203735, "created_at": "2025-06-03T07:35:35.292350+00:00"} {"global_step": 234746, "acc_step": 0, "speed/wps": 5536.450068221557, "speed/FLOPS": 244682754895030.8, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 192.91, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04696483165025711, "optim/lr": 1.5093442777051492e-05, "optim/total_tokens": 1969192173568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2648695707321167, "created_at": "2025-06-03T07:35:38.256103+00:00"} {"global_step": 234747, "acc_step": 0, "speed/wps": 5530.621037019409, "speed/FLOPS": 244425141551582.28, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046775445342063904, "optim/lr": 1.5089895551957167e-05, "optim/total_tokens": 1969200562176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.290600299835205, "created_at": "2025-06-03T07:35:41.223815+00:00"} {"global_step": 234748, "acc_step": 0, "speed/wps": 5533.717441646641, "speed/FLOPS": 244561986787270.3, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04676497355103493, "optim/lr": 1.508634832686262e-05, "optim/total_tokens": 1969208950784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2738795280456543, "created_at": "2025-06-03T07:35:44.189496+00:00"} {"global_step": 234749, "acc_step": 0, "speed/wps": 5524.894738796885, "speed/FLOPS": 244172068479997.97, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04457265883684158, "optim/lr": 1.5082801101768073e-05, "optim/total_tokens": 1969217339392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2783766984939575, "created_at": "2025-06-03T07:35:47.159358+00:00"} {"global_step": 234750, "acc_step": 0, "speed/wps": 5524.640045233235, "speed/FLOPS": 244160812328124.47, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04906183108687401, "optim/lr": 1.5079253876673526e-05, "optim/total_tokens": 1969225728000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2705154418945312, "created_at": "2025-06-03T07:35:50.133357+00:00"} {"global_step": 234751, "acc_step": 0, "speed/wps": 5520.427396520018, "speed/FLOPS": 243974634817291.1, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04595188796520233, "optim/lr": 1.5075706651579202e-05, "optim/total_tokens": 1969234116608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2632323503494263, "created_at": "2025-06-03T07:35:53.105295+00:00"} {"global_step": 234752, "acc_step": 0, "speed/wps": 5521.378002423143, "speed/FLOPS": 244016646732567.12, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.052270326763391495, "optim/lr": 1.5072159426484656e-05, "optim/total_tokens": 1969242505216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2651524543762207, "created_at": "2025-06-03T07:35:56.076599+00:00"} {"global_step": 234753, "acc_step": 0, "speed/wps": 5519.779007145814, "speed/FLOPS": 243945979325708.94, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04613983631134033, "optim/lr": 1.5068612201390108e-05, "optim/total_tokens": 1969250893824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.266190767288208, "created_at": "2025-06-03T07:35:59.052244+00:00"} {"global_step": 234754, "acc_step": 0, "speed/wps": 5516.789693611882, "speed/FLOPS": 243813866968202.88, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04863706976175308, "optim/lr": 1.5065064976295561e-05, "optim/total_tokens": 1969259282432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2561476230621338, "created_at": "2025-06-03T07:36:02.026443+00:00"} {"global_step": 234755, "acc_step": 0, "speed/wps": 5511.046325735624, "speed/FLOPS": 243560039505293.97, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04724862799048424, "optim/lr": 1.5061517751201237e-05, "optim/total_tokens": 1969267671040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2829821109771729, "created_at": "2025-06-03T07:36:05.007048+00:00"} {"global_step": 234756, "acc_step": 0, "speed/wps": 5528.368497965542, "speed/FLOPS": 244325590854941.38, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.044784847646951675, "optim/lr": 1.505797052610669e-05, "optim/total_tokens": 1969276059648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2745078802108765, "created_at": "2025-06-03T07:36:07.975305+00:00"} {"global_step": 234757, "acc_step": 0, "speed/wps": 5532.495228162395, "speed/FLOPS": 244507971207122.3, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.06, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0525527261197567, "optim/lr": 1.5054423301012144e-05, "optim/total_tokens": 1969284448256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2685847282409668, "created_at": "2025-06-03T07:36:10.941196+00:00"} {"global_step": 234758, "acc_step": 0, "speed/wps": 5522.603804235771, "speed/FLOPS": 244070820898462.84, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04715127497911453, "optim/lr": 1.505087607591782e-05, "optim/total_tokens": 1969292836864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2700250148773193, "created_at": "2025-06-03T07:36:13.912826+00:00"} {"global_step": 234759, "acc_step": 0, "speed/wps": 5526.2590150515425, "speed/FLOPS": 244232362507454.97, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04838194325566292, "optim/lr": 1.5047328850823271e-05, "optim/total_tokens": 1969301225472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2561954259872437, "created_at": "2025-06-03T07:36:16.882591+00:00"} {"global_step": 234760, "acc_step": 0, "speed/wps": 5524.177624799841, "speed/FLOPS": 244140375711850.84, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.35, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05378827080130577, "optim/lr": 1.5043781625728725e-05, "optim/total_tokens": 1969309614080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2709261178970337, "created_at": "2025-06-03T07:36:19.853006+00:00"} {"global_step": 234761, "acc_step": 0, "speed/wps": 5520.124521344565, "speed/FLOPS": 243961249284791.78, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045821595937013626, "optim/lr": 1.5040234400634179e-05, "optim/total_tokens": 1969318002688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.259751319885254, "created_at": "2025-06-03T07:36:22.829171+00:00"} {"global_step": 234762, "acc_step": 0, "speed/wps": 5508.727038191526, "speed/FLOPS": 243457538867034.62, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.5 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.5, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05198175087571144, "optim/lr": 1.5036687175539854e-05, "optim/total_tokens": 1969326391296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2690836191177368, "created_at": "2025-06-03T07:36:25.807508+00:00"} {"global_step": 234763, "acc_step": 0, "speed/wps": 5530.42434597948, "speed/FLOPS": 244416448814373.38, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0458090640604496, "optim/lr": 1.5033139950445308e-05, "optim/total_tokens": 1969334779904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.265508770942688, "created_at": "2025-06-03T07:36:28.777418+00:00"} {"global_step": 234764, "acc_step": 0, "speed/wps": 5530.717622060334, "speed/FLOPS": 244429410116024.1, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05146944895386696, "optim/lr": 1.502959272535076e-05, "optim/total_tokens": 1969343168512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2647124528884888, "created_at": "2025-06-03T07:36:31.744167+00:00"} {"global_step": 234765, "acc_step": 0, "speed/wps": 5527.749285537006, "speed/FLOPS": 244298224835016.6, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04558875411748886, "optim/lr": 1.5026045500256213e-05, "optim/total_tokens": 1969351557120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.264121651649475, "created_at": "2025-06-03T07:36:34.711955+00:00"} {"global_step": 234766, "acc_step": 0, "speed/wps": 5526.786636362444, "speed/FLOPS": 244255680668786.12, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04687916114926338, "optim/lr": 1.5022498275161889e-05, "optim/total_tokens": 1969359945728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2666723728179932, "created_at": "2025-06-03T07:36:37.681797+00:00"} {"global_step": 234767, "acc_step": 0, "speed/wps": 5517.222128024912, "speed/FLOPS": 243832978355858.8, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04851122945547104, "optim/lr": 1.5018951050067342e-05, "optim/total_tokens": 1969368334336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2747694253921509, "created_at": "2025-06-03T07:36:40.655261+00:00"} {"global_step": 234768, "acc_step": 0, "speed/wps": 5520.131200406805, "speed/FLOPS": 243961544465156.22, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.045974913984537125, "optim/lr": 1.5015403824972796e-05, "optim/total_tokens": 1969376722944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2649223804473877, "created_at": "2025-06-03T07:36:43.631547+00:00"} {"global_step": 234769, "acc_step": 0, "speed/wps": 5509.0534149538125, "speed/FLOPS": 243471963049380.0, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.046945296227931976, "optim/lr": 1.5011856599878248e-05, "optim/total_tokens": 1969385111552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.262603521347046, "created_at": "2025-06-03T07:36:46.612957+00:00"} {"global_step": 234770, "acc_step": 0, "speed/wps": 5515.4572380999425, "speed/FLOPS": 243754979254700.72, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.49 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.49, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04568781703710556, "optim/lr": 1.5008309374783923e-05, "optim/total_tokens": 1969393500160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2576758861541748, "created_at": "2025-06-03T07:36:49.587394+00:00"} {"global_step": 234771, "acc_step": 0, "speed/wps": 5537.613451271684, "speed/FLOPS": 244734170471112.2, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04642850533127785, "optim/lr": 1.5004762149689377e-05, "optim/total_tokens": 1969401888768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.267881155014038, "created_at": "2025-06-03T07:36:52.550719+00:00"} {"global_step": 234772, "acc_step": 0, "speed/wps": 5532.7799387285, "speed/FLOPS": 244520553956863.4, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04682736098766327, "optim/lr": 1.500121492459483e-05, "optim/total_tokens": 1969410277376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2756739854812622, "created_at": "2025-06-03T07:36:55.516017+00:00"} {"global_step": 234773, "acc_step": 0, "speed/wps": 5523.287381544236, "speed/FLOPS": 244101031516631.16, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04929176717996597, "optim/lr": 1.4997667699500284e-05, "optim/total_tokens": 1969418665984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2703721523284912, "created_at": "2025-06-03T07:36:58.486696+00:00"} {"global_step": 234774, "acc_step": 0, "speed/wps": 5533.147051522001, "speed/FLOPS": 244536778463282.5, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04644755274057388, "optim/lr": 1.499412047440596e-05, "optim/total_tokens": 1969427054592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2520123720169067, "created_at": "2025-06-03T07:37:01.451788+00:00"} {"global_step": 234775, "acc_step": 0, "speed/wps": 5518.177143177186, "speed/FLOPS": 243875185137378.62, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.04702885076403618, "optim/lr": 1.4990573249311412e-05, "optim/total_tokens": 1969435443200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2641006708145142, "created_at": "2025-06-03T07:37:04.428458+00:00"} {"global_step": 234776, "acc_step": 0, "speed/wps": 5533.39958086478, "speed/FLOPS": 244547938967671.0, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.04, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04561315476894379, "optim/lr": 1.4987026024216865e-05, "optim/total_tokens": 1969443831808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2755497694015503, "created_at": "2025-06-03T07:37:07.394481+00:00"} {"global_step": 234777, "acc_step": 0, "speed/wps": 5524.463048646531, "speed/FLOPS": 244152989984942.84, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04685874655842781, "optim/lr": 1.4983478799122319e-05, "optim/total_tokens": 1969452220416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2515954971313477, "created_at": "2025-06-03T07:37:10.364367+00:00"} {"global_step": 234778, "acc_step": 0, "speed/wps": 5512.407963444555, "speed/FLOPS": 243620216922535.12, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.0456237867474556, "optim/lr": 1.4979931574027994e-05, "optim/total_tokens": 1969460609024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2713558673858643, "created_at": "2025-06-03T07:37:13.340888+00:00"} {"global_step": 234779, "acc_step": 0, "speed/wps": 5522.859155327767, "speed/FLOPS": 244082106109723.72, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045166466385126114, "optim/lr": 1.4976384348933448e-05, "optim/total_tokens": 1969468997632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2660940885543823, "created_at": "2025-06-03T07:37:16.314050+00:00"} {"global_step": 234780, "acc_step": 0, "speed/wps": 5532.757520178797, "speed/FLOPS": 244519563171715.06, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047567468136548996, "optim/lr": 1.49728371238389e-05, "optim/total_tokens": 1969477386240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2783452272415161, "created_at": "2025-06-03T07:37:19.281128+00:00"} {"global_step": 234781, "acc_step": 0, "speed/wps": 5536.489476354134, "speed/FLOPS": 244684496532781.62, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04645753651857376, "optim/lr": 1.4969289898744353e-05, "optim/total_tokens": 1969485774848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2960790395736694, "created_at": "2025-06-03T07:37:22.245593+00:00"} {"global_step": 234782, "acc_step": 0, "speed/wps": 5531.626063804847, "speed/FLOPS": 244469558591305.2, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.0, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04833332076668739, "optim/lr": 1.4965742673650029e-05, "optim/total_tokens": 1969494163456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.268892526626587, "created_at": "2025-06-03T07:37:25.212399+00:00"} {"global_step": 234783, "acc_step": 0, "speed/wps": 5531.788422108456, "speed/FLOPS": 244476733997299.56, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04757620766758919, "optim/lr": 1.4962195448555483e-05, "optim/total_tokens": 1969502552064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.265109896659851, "created_at": "2025-06-03T07:37:28.182396+00:00"} {"global_step": 234784, "acc_step": 0, "speed/wps": 5528.598943560638, "speed/FLOPS": 244335775370717.16, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04958502575755119, "optim/lr": 1.4958648223460936e-05, "optim/total_tokens": 1969510940672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2567222118377686, "created_at": "2025-06-03T07:37:31.150331+00:00"} {"global_step": 234785, "acc_step": 0, "speed/wps": 5514.8561184422515, "speed/FLOPS": 243728412842640.1, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04538718983530998, "optim/lr": 1.495510099836661e-05, "optim/total_tokens": 1969519329280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.27791166305542, "created_at": "2025-06-03T07:37:34.128006+00:00"} {"global_step": 234786, "acc_step": 0, "speed/wps": 5523.668192182796, "speed/FLOPS": 244117861397689.94, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04808253049850464, "optim/lr": 1.4951553773272064e-05, "optim/total_tokens": 1969527717888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2856804132461548, "created_at": "2025-06-03T07:37:37.098624+00:00"} {"global_step": 234787, "acc_step": 0, "speed/wps": 5503.486659814552, "speed/FLOPS": 243225940965460.44, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.48 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.48, "speed/est_time_remaining_days": 0.15, "optim/grad_norm": 0.05019696056842804, "optim/lr": 1.4948006548177517e-05, "optim/total_tokens": 1969536106496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2630813121795654, "created_at": "2025-06-03T07:37:40.080160+00:00"} {"global_step": 234788, "acc_step": 0, "speed/wps": 5531.819367921423, "speed/FLOPS": 244478101643837.7, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04571853578090668, "optim/lr": 1.4944459323082971e-05, "optim/total_tokens": 1969544495104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.266501784324646, "created_at": "2025-06-03T07:37:43.046342+00:00"} {"global_step": 234789, "acc_step": 0, "speed/wps": 5533.314790392816, "speed/FLOPS": 244544191662807.16, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04999702796339989, "optim/lr": 1.4940912097988646e-05, "optim/total_tokens": 1969552883712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2674493789672852, "created_at": "2025-06-03T07:37:46.014208+00:00"} {"global_step": 234790, "acc_step": 0, "speed/wps": 5523.491152940314, "speed/FLOPS": 244110037169341.25, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05029485374689102, "optim/lr": 1.49373648728941e-05, "optim/total_tokens": 1969561272320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2747828960418701, "created_at": "2025-06-03T07:37:48.984746+00:00"} {"global_step": 234791, "acc_step": 0, "speed/wps": 5519.44367177522, "speed/FLOPS": 243931159218730.7, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04840102791786194, "optim/lr": 1.4933817647799552e-05, "optim/total_tokens": 1969569660928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2615660429000854, "created_at": "2025-06-03T07:37:51.957395+00:00"} {"global_step": 234792, "acc_step": 0, "speed/wps": 5531.468233589064, "speed/FLOPS": 244462583303615.84, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05397497117519379, "optim/lr": 1.4930270422705006e-05, "optim/total_tokens": 1969578049536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2628397941589355, "created_at": "2025-06-03T07:37:54.923901+00:00"} {"global_step": 234793, "acc_step": 0, "speed/wps": 5529.050547319214, "speed/FLOPS": 244355733945328.62, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048086173832416534, "optim/lr": 1.4926723197610681e-05, "optim/total_tokens": 1969586438144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.284187912940979, "created_at": "2025-06-03T07:37:57.891191+00:00"} {"global_step": 234794, "acc_step": 0, "speed/wps": 5515.707765315138, "speed/FLOPS": 243766051275297.8, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.47 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.47, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05720331519842148, "optim/lr": 1.4923175972516135e-05, "optim/total_tokens": 1969594826752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2752294540405273, "created_at": "2025-06-03T07:38:00.868109+00:00"} {"global_step": 234795, "acc_step": 0, "speed/wps": 5519.012635632468, "speed/FLOPS": 243912109627464.06, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046403512358665466, "optim/lr": 1.4919628747421588e-05, "optim/total_tokens": 1969603215360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2675174474716187, "created_at": "2025-06-03T07:38:03.843315+00:00"} {"global_step": 234796, "acc_step": 0, "speed/wps": 5525.50835349981, "speed/FLOPS": 244199187109102.53, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05408896133303642, "optim/lr": 1.491608152232704e-05, "optim/total_tokens": 1969611603968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2720993757247925, "created_at": "2025-06-03T07:38:06.812641+00:00"} {"global_step": 234797, "acc_step": 0, "speed/wps": 5522.291916613876, "speed/FLOPS": 244057037061960.66, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04525580257177353, "optim/lr": 1.4912534297232716e-05, "optim/total_tokens": 1969619992576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.259399652481079, "created_at": "2025-06-03T07:38:09.783657+00:00"} {"global_step": 234798, "acc_step": 0, "speed/wps": 5538.602094222131, "speed/FLOPS": 244777863429188.6, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04904535040259361, "optim/lr": 1.490898707213817e-05, "optim/total_tokens": 1969628381184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.268559455871582, "created_at": "2025-06-03T07:38:12.746345+00:00"} {"global_step": 234799, "acc_step": 0, "speed/wps": 5524.873314116542, "speed/FLOPS": 244171121618788.28, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04975835978984833, "optim/lr": 1.4905439847043623e-05, "optim/total_tokens": 1969636769792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.276825189590454, "created_at": "2025-06-03T07:38:15.721330+00:00"} {"global_step": 234800, "acc_step": 0, "speed/wps": 5523.953591140085, "speed/FLOPS": 244130474570797.84, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.051190707832574844, "optim/lr": 1.4901892621949077e-05, "optim/total_tokens": 1969645158400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.249833345413208, "created_at": "2025-06-03T07:38:18.692133+00:00"} {"global_step": 234801, "acc_step": 0, "speed/wps": 5529.9243397584305, "speed/FLOPS": 244394351098666.84, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0451592318713665, "optim/lr": 1.489834539685475e-05, "optim/total_tokens": 1969653547008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2617995738983154, "created_at": "2025-06-03T07:38:21.658895+00:00"} {"global_step": 234802, "acc_step": 0, "speed/wps": 5525.309046733697, "speed/FLOPS": 244190378770184.8, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04561013728380203, "optim/lr": 1.4894798171760204e-05, "optim/total_tokens": 1969661935616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.26460862159729, "created_at": "2025-06-03T07:38:24.632421+00:00"} {"global_step": 234803, "acc_step": 0, "speed/wps": 5525.732175709962, "speed/FLOPS": 244209078905165.28, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04580596089363098, "optim/lr": 1.4891250946665658e-05, "optim/total_tokens": 1969670324224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2773045301437378, "created_at": "2025-06-03T07:38:27.605545+00:00"} {"global_step": 234804, "acc_step": 0, "speed/wps": 5518.778534347656, "speed/FLOPS": 243901763548914.38, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046481627970933914, "optim/lr": 1.4887703721571111e-05, "optim/total_tokens": 1969678712832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2624680995941162, "created_at": "2025-06-03T07:38:30.578683+00:00"} {"global_step": 234805, "acc_step": 0, "speed/wps": 5521.267778767967, "speed/FLOPS": 244011775411184.16, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04582799971103668, "optim/lr": 1.4884156496476787e-05, "optim/total_tokens": 1969687101440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.258463978767395, "created_at": "2025-06-03T07:38:33.553627+00:00"} {"global_step": 234806, "acc_step": 0, "speed/wps": 5536.022112576955, "speed/FLOPS": 244663841446014.97, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04739127680659294, "optim/lr": 1.4880609271382239e-05, "optim/total_tokens": 1969695490048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.26627779006958, "created_at": "2025-06-03T07:38:36.520401+00:00"} {"global_step": 234807, "acc_step": 0, "speed/wps": 5524.384727205071, "speed/FLOPS": 244149528578115.78, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045838482677936554, "optim/lr": 1.4877062046287692e-05, "optim/total_tokens": 1969703878656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2678136825561523, "created_at": "2025-06-03T07:38:39.494309+00:00"} {"global_step": 234808, "acc_step": 0, "speed/wps": 5524.293136781322, "speed/FLOPS": 244145480750188.34, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045588020235300064, "optim/lr": 1.4873514821193146e-05, "optim/total_tokens": 1969712267264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2686411142349243, "created_at": "2025-06-03T07:38:42.469405+00:00"} {"global_step": 234809, "acc_step": 0, "speed/wps": 5522.006553265356, "speed/FLOPS": 244044425462578.1, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04633268713951111, "optim/lr": 1.4869967596098821e-05, "optim/total_tokens": 1969720655872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2801982164382935, "created_at": "2025-06-03T07:38:45.441427+00:00"} {"global_step": 234810, "acc_step": 0, "speed/wps": 5533.522877858053, "speed/FLOPS": 244553388063682.47, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04634493961930275, "optim/lr": 1.4866420371004275e-05, "optim/total_tokens": 1969729044480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2711219787597656, "created_at": "2025-06-03T07:38:48.406662+00:00"} {"global_step": 234811, "acc_step": 0, "speed/wps": 5515.48341386908, "speed/FLOPS": 243756136089716.88, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046613458544015884, "optim/lr": 1.4862873145909729e-05, "optim/total_tokens": 1969737433088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2641886472702026, "created_at": "2025-06-03T07:38:51.383282+00:00"} {"global_step": 234812, "acc_step": 0, "speed/wps": 5516.986361517324, "speed/FLOPS": 243822558682985.8, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045744992792606354, "optim/lr": 1.4859325920815402e-05, "optim/total_tokens": 1969745821696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2732881307601929, "created_at": "2025-06-03T07:38:54.357106+00:00"} {"global_step": 234813, "acc_step": 0, "speed/wps": 5513.048393439033, "speed/FLOPS": 243648520650273.2, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.46 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.46, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047271810472011566, "optim/lr": 1.4855778695720856e-05, "optim/total_tokens": 1969754210304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2695080041885376, "created_at": "2025-06-03T07:38:57.337001+00:00"} {"global_step": 234814, "acc_step": 0, "speed/wps": 5522.666876960055, "speed/FLOPS": 244073608390040.7, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045874956995248795, "optim/lr": 1.485223147062631e-05, "optim/total_tokens": 1969762598912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2776165008544922, "created_at": "2025-06-03T07:39:00.310514+00:00"} {"global_step": 234815, "acc_step": 0, "speed/wps": 5529.673568409153, "speed/FLOPS": 244383268288592.9, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05104013532400131, "optim/lr": 1.4848684245531763e-05, "optim/total_tokens": 1969770987520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2780355215072632, "created_at": "2025-06-03T07:39:03.277919+00:00"} {"global_step": 234816, "acc_step": 0, "speed/wps": 5515.54528045481, "speed/FLOPS": 243758870276144.25, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046961743384599686, "optim/lr": 1.4845137020437439e-05, "optim/total_tokens": 1969779376128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2725415229797363, "created_at": "2025-06-03T07:39:06.256367+00:00"} {"global_step": 234817, "acc_step": 0, "speed/wps": 5520.088342361254, "speed/FLOPS": 243959650358910.22, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04606263339519501, "optim/lr": 1.484158979534289e-05, "optim/total_tokens": 1969787764736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.27211594581604, "created_at": "2025-06-03T07:39:09.234706+00:00"} {"global_step": 234818, "acc_step": 0, "speed/wps": 5514.7856597516175, "speed/FLOPS": 243725298929154.34, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048850167542696, "optim/lr": 1.4838042570248344e-05, "optim/total_tokens": 1969796153344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2840791940689087, "created_at": "2025-06-03T07:39:12.209900+00:00"} {"global_step": 234819, "acc_step": 0, "speed/wps": 5518.75828369522, "speed/FLOPS": 243900868573728.9, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046853844076395035, "optim/lr": 1.4834495345153798e-05, "optim/total_tokens": 1969804541952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.290396809577942, "created_at": "2025-06-03T07:39:15.187863+00:00"} {"global_step": 234820, "acc_step": 0, "speed/wps": 5524.312717260041, "speed/FLOPS": 244146346107125.75, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.052599623799324036, "optim/lr": 1.4830948120059473e-05, "optim/total_tokens": 1969812930560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.269649624824524, "created_at": "2025-06-03T07:39:18.160844+00:00"} {"global_step": 234821, "acc_step": 0, "speed/wps": 5513.738994251002, "speed/FLOPS": 243679041671346.8, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047287069261074066, "optim/lr": 1.4827400894964927e-05, "optim/total_tokens": 1969821319168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2710176706314087, "created_at": "2025-06-03T07:39:21.139101+00:00"} {"global_step": 234822, "acc_step": 0, "speed/wps": 5530.147760188408, "speed/FLOPS": 244404225138102.44, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04826415330171585, "optim/lr": 1.4823853669870379e-05, "optim/total_tokens": 1969829707776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2705515623092651, "created_at": "2025-06-03T07:39:24.111675+00:00"} {"global_step": 234823, "acc_step": 0, "speed/wps": 5520.177127624964, "speed/FLOPS": 243963574213122.03, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04598844423890114, "optim/lr": 1.4820306444775833e-05, "optim/total_tokens": 1969838096384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2748152017593384, "created_at": "2025-06-03T07:39:27.084333+00:00"} {"global_step": 234824, "acc_step": 0, "speed/wps": 5529.936018385976, "speed/FLOPS": 244394867234227.75, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047339215874671936, "optim/lr": 1.4816759219681508e-05, "optim/total_tokens": 1969846484992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2731947898864746, "created_at": "2025-06-03T07:39:30.051595+00:00"} {"global_step": 234825, "acc_step": 0, "speed/wps": 5531.36291163411, "speed/FLOPS": 244457928612293.53, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04657243192195892, "optim/lr": 1.4813211994586962e-05, "optim/total_tokens": 1969854873600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.274618148803711, "created_at": "2025-06-03T07:39:33.018487+00:00"} {"global_step": 234826, "acc_step": 0, "speed/wps": 5523.890220610798, "speed/FLOPS": 244127673917763.12, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04845936968922615, "optim/lr": 1.4809664769492415e-05, "optim/total_tokens": 1969863262208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2869600057601929, "created_at": "2025-06-03T07:39:35.988781+00:00"} {"global_step": 234827, "acc_step": 0, "speed/wps": 5522.89558910672, "speed/FLOPS": 244083716296268.4, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048992909491062164, "optim/lr": 1.4806117544397867e-05, "optim/total_tokens": 1969871650816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2789294719696045, "created_at": "2025-06-03T07:39:38.960842+00:00"} {"global_step": 234828, "acc_step": 0, "speed/wps": 5505.8579862254155, "speed/FLOPS": 243330741455271.75, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.45 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.45, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0518842488527298, "optim/lr": 1.4802570319303543e-05, "optim/total_tokens": 1969880039424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2611247301101685, "created_at": "2025-06-03T07:39:41.941094+00:00"} {"global_step": 234829, "acc_step": 0, "speed/wps": 5508.222991978068, "speed/FLOPS": 243435262604342.22, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049370069056749344, "optim/lr": 1.4799023094208996e-05, "optim/total_tokens": 1969888428032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2629328966140747, "created_at": "2025-06-03T07:39:44.919981+00:00"} {"global_step": 234830, "acc_step": 0, "speed/wps": 5527.865370326157, "speed/FLOPS": 244303355188521.28, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.053432807326316833, "optim/lr": 1.479547586911445e-05, "optim/total_tokens": 1969896816640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2819913625717163, "created_at": "2025-06-03T07:39:47.888803+00:00"} {"global_step": 234831, "acc_step": 0, "speed/wps": 5515.336983195068, "speed/FLOPS": 243749664603425.62, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.051313452422618866, "optim/lr": 1.4791928644019904e-05, "optim/total_tokens": 1969905205248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2640656232833862, "created_at": "2025-06-03T07:39:50.864384+00:00"} {"global_step": 234832, "acc_step": 0, "speed/wps": 5532.703973489173, "speed/FLOPS": 244517196682110.5, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05203070491552353, "optim/lr": 1.4788381418925579e-05, "optim/total_tokens": 1969913593856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2683650255203247, "created_at": "2025-06-03T07:39:53.831880+00:00"} {"global_step": 234833, "acc_step": 0, "speed/wps": 5529.469448360989, "speed/FLOPS": 244374247227245.2, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04732602462172508, "optim/lr": 1.4784834193831031e-05, "optim/total_tokens": 1969921982464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2993578910827637, "created_at": "2025-06-03T07:39:56.800305+00:00"} {"global_step": 234834, "acc_step": 0, "speed/wps": 5532.176620527816, "speed/FLOPS": 244493890380455.66, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04535002261400223, "optim/lr": 1.4781286968736485e-05, "optim/total_tokens": 1969930371072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.271074652671814, "created_at": "2025-06-03T07:39:59.766074+00:00"} {"global_step": 234835, "acc_step": 0, "speed/wps": 5525.251517048005, "speed/FLOPS": 244187836252540.84, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04819169268012047, "optim/lr": 1.4777739743641938e-05, "optim/total_tokens": 1969938759680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2875959873199463, "created_at": "2025-06-03T07:40:02.739707+00:00"} {"global_step": 234836, "acc_step": 0, "speed/wps": 5515.816968094508, "speed/FLOPS": 243770877479195.5, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04508689045906067, "optim/lr": 1.4774192518547614e-05, "optim/total_tokens": 1969947148288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2657363414764404, "created_at": "2025-06-03T07:40:05.718095+00:00"} {"global_step": 234837, "acc_step": 0, "speed/wps": 5506.698752881836, "speed/FLOPS": 243367899038051.7, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046557117253541946, "optim/lr": 1.4770645293453067e-05, "optim/total_tokens": 1969955536896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2606182098388672, "created_at": "2025-06-03T07:40:08.698166+00:00"} {"global_step": 234838, "acc_step": 0, "speed/wps": 5520.5710797778565, "speed/FLOPS": 243980984881849.97, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04608535394072533, "optim/lr": 1.476709806835852e-05, "optim/total_tokens": 1969963925504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2735381126403809, "created_at": "2025-06-03T07:40:11.674793+00:00"} {"global_step": 234839, "acc_step": 0, "speed/wps": 5535.905098760984, "speed/FLOPS": 244658670034280.1, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046223413199186325, "optim/lr": 1.4763550843264195e-05, "optim/total_tokens": 1969972314112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.26850426197052, "created_at": "2025-06-03T07:40:14.638880+00:00"} {"global_step": 234840, "acc_step": 0, "speed/wps": 5535.292936143092, "speed/FLOPS": 244631615579901.6, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.03, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04494010657072067, "optim/lr": 1.4760003618169648e-05, "optim/total_tokens": 1969980702720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2488218545913696, "created_at": "2025-06-03T07:40:17.603141+00:00"} {"global_step": 234841, "acc_step": 0, "speed/wps": 5506.5560515110255, "speed/FLOPS": 243361592367873.7, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.44 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.44, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0455181859433651, "optim/lr": 1.4756456393075102e-05, "optim/total_tokens": 1969989091328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2683225870132446, "created_at": "2025-06-03T07:40:20.582502+00:00"} {"global_step": 234842, "acc_step": 0, "speed/wps": 5514.357028311232, "speed/FLOPS": 243706355613423.9, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.76, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04584100842475891, "optim/lr": 1.4752909167980556e-05, "optim/total_tokens": 1969997479936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2851207256317139, "created_at": "2025-06-03T07:40:23.558257+00:00"} {"global_step": 234843, "acc_step": 0, "speed/wps": 5509.995532819147, "speed/FLOPS": 243513599836831.4, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04545280709862709, "optim/lr": 1.4749361942886231e-05, "optim/total_tokens": 1970005868544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2775293588638306, "created_at": "2025-06-03T07:40:26.536424+00:00"} {"global_step": 234844, "acc_step": 0, "speed/wps": 5505.754202018029, "speed/FLOPS": 243326154724521.0, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04535713046789169, "optim/lr": 1.4745814717791683e-05, "optim/total_tokens": 1970014257152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2516987323760986, "created_at": "2025-06-03T07:40:29.517283+00:00"} {"global_step": 234845, "acc_step": 0, "speed/wps": 5514.848667258961, "speed/FLOPS": 243728083538477.25, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 193.75, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045566126704216, "optim/lr": 1.4742267492697137e-05, "optim/total_tokens": 1970022645760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2682472467422485, "created_at": "2025-06-03T07:40:32.498818+00:00"} {"global_step": 234846, "acc_step": 0, "speed/wps": 5504.341710675545, "speed/FLOPS": 243263729836969.3, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04554017633199692, "optim/lr": 1.473872026760259e-05, "optim/total_tokens": 1970031034368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.3001312017440796, "created_at": "2025-06-03T07:40:35.480146+00:00"} {"global_step": 234847, "acc_step": 0, "speed/wps": 5507.195485737742, "speed/FLOPS": 243389852087773.5, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045592162758111954, "optim/lr": 1.4735173042508266e-05, "optim/total_tokens": 1970039422976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2761415243148804, "created_at": "2025-06-03T07:40:38.463724+00:00"} {"global_step": 234848, "acc_step": 0, "speed/wps": 5526.664543514478, "speed/FLOPS": 244250284789833.88, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04527567699551582, "optim/lr": 1.473162581741372e-05, "optim/total_tokens": 1970047811584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2616395950317383, "created_at": "2025-06-03T07:40:41.433111+00:00"} {"global_step": 234849, "acc_step": 0, "speed/wps": 5533.102073782815, "speed/FLOPS": 244534790677427.44, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.02, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046958185732364655, "optim/lr": 1.4728078592319171e-05, "optim/total_tokens": 1970056200192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2834984064102173, "created_at": "2025-06-03T07:40:44.398347+00:00"} {"global_step": 234850, "acc_step": 0, "speed/wps": 5521.250813908761, "speed/FLOPS": 244011025651241.28, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04536769911646843, "optim/lr": 1.4724531367224625e-05, "optim/total_tokens": 1970064588800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2604444026947021, "created_at": "2025-06-03T07:40:47.371848+00:00"} {"global_step": 234851, "acc_step": 0, "speed/wps": 5514.977566059955, "speed/FLOPS": 243733780205717.34, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.75, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05007292702794075, "optim/lr": 1.47209841421303e-05, "optim/total_tokens": 1970072977408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 359, "loss/out": 1.2518365383148193, "created_at": "2025-06-03T07:40:50.347633+00:00"} {"global_step": 234852, "acc_step": 0, "speed/wps": 5519.669911101645, "speed/FLOPS": 243941157838960.84, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04515762999653816, "optim/lr": 1.4717436917035754e-05, "optim/total_tokens": 1970081366016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2614423036575317, "created_at": "2025-06-03T07:40:53.320757+00:00"} {"global_step": 234853, "acc_step": 0, "speed/wps": 5514.435368171713, "speed/FLOPS": 243709817834277.4, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.052390389144420624, "optim/lr": 1.4713889691941208e-05, "optim/total_tokens": 1970089754624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2631893157958984, "created_at": "2025-06-03T07:40:56.296160+00:00"} {"global_step": 234854, "acc_step": 0, "speed/wps": 5506.117627580087, "speed/FLOPS": 243342216274183.3, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.43 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.43, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0455237440764904, "optim/lr": 1.471034246684666e-05, "optim/total_tokens": 1970098143232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.267305612564087, "created_at": "2025-06-03T07:40:59.276092+00:00"} {"global_step": 234855, "acc_step": 0, "speed/wps": 5514.767305451111, "speed/FLOPS": 243724487763017.75, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.76, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04945893958210945, "optim/lr": 1.4706795241752335e-05, "optim/total_tokens": 1970106531840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2544282674789429, "created_at": "2025-06-03T07:41:02.256177+00:00"} {"global_step": 234856, "acc_step": 0, "speed/wps": 5525.145865563913, "speed/FLOPS": 244183166997717.3, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04730217903852463, "optim/lr": 1.4703248016657789e-05, "optim/total_tokens": 1970114920448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2650834321975708, "created_at": "2025-06-03T07:41:05.226006+00:00"} {"global_step": 234857, "acc_step": 0, "speed/wps": 5531.005252857913, "speed/FLOPS": 244442121925049.2, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04883847013115883, "optim/lr": 1.4699700791563242e-05, "optim/total_tokens": 1970123309056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.274691104888916, "created_at": "2025-06-03T07:41:08.192560+00:00"} {"global_step": 234858, "acc_step": 0, "speed/wps": 5531.796524031681, "speed/FLOPS": 244477092060836.72, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047446489334106445, "optim/lr": 1.4696153566468696e-05, "optim/total_tokens": 1970131697664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2707107067108154, "created_at": "2025-06-03T07:41:11.158692+00:00"} {"global_step": 234859, "acc_step": 0, "speed/wps": 5518.182952509589, "speed/FLOPS": 243875441880136.0, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046120885759592056, "optim/lr": 1.469260634137437e-05, "optim/total_tokens": 1970140086272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2610772848129272, "created_at": "2025-06-03T07:41:14.131916+00:00"} {"global_step": 234860, "acc_step": 0, "speed/wps": 5525.620796677158, "speed/FLOPS": 244204156522004.94, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04761781170964241, "optim/lr": 1.4689059116279823e-05, "optim/total_tokens": 1970148474880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2443712949752808, "created_at": "2025-06-03T07:41:17.101912+00:00"} {"global_step": 234861, "acc_step": 0, "speed/wps": 5504.400572365185, "speed/FLOPS": 243266331222369.97, "speed/curr_iter_time": 2.9756, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9756, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046237315982580185, "optim/lr": 1.4685511891185277e-05, "optim/total_tokens": 1970156863488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2863105535507202, "created_at": "2025-06-03T07:41:20.086812+00:00"} {"global_step": 234862, "acc_step": 0, "speed/wps": 5510.205613521755, "speed/FLOPS": 243522884328596.2, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.42 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.42, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04827360063791275, "optim/lr": 1.468196466609073e-05, "optim/total_tokens": 1970165252096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2748416662216187, "created_at": "2025-06-03T07:41:23.064472+00:00"} {"global_step": 234863, "acc_step": 0, "speed/wps": 5510.322897441586, "speed/FLOPS": 243528067677539.2, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048779718577861786, "optim/lr": 1.4678417440996406e-05, "optim/total_tokens": 1970173640704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.267927885055542, "created_at": "2025-06-03T07:41:26.042249+00:00"} {"global_step": 234864, "acc_step": 0, "speed/wps": 5525.016055480224, "speed/FLOPS": 244177430056446.5, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05018515884876251, "optim/lr": 1.4674870215901858e-05, "optim/total_tokens": 1970182029312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.269711971282959, "created_at": "2025-06-03T07:41:29.011998+00:00"} {"global_step": 234865, "acc_step": 0, "speed/wps": 5523.5498625635855, "speed/FLOPS": 244112631834186.75, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04710442200303078, "optim/lr": 1.4671322990807312e-05, "optim/total_tokens": 1970190417920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2799851894378662, "created_at": "2025-06-03T07:41:31.982718+00:00"} {"global_step": 234866, "acc_step": 0, "speed/wps": 5514.741707828276, "speed/FLOPS": 243723356479108.97, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04709123447537422, "optim/lr": 1.4667775765712987e-05, "optim/total_tokens": 1970198806528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.24993896484375, "created_at": "2025-06-03T07:41:34.959203+00:00"} {"global_step": 234867, "acc_step": 0, "speed/wps": 5507.808516919507, "speed/FLOPS": 243416944928229.47, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046320389956235886, "optim/lr": 1.466422854061844e-05, "optim/total_tokens": 1970207195136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.274780035018921, "created_at": "2025-06-03T07:41:37.938311+00:00"} {"global_step": 234868, "acc_step": 0, "speed/wps": 5522.71252433845, "speed/FLOPS": 244075625770521.3, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04568953439593315, "optim/lr": 1.4660681315523894e-05, "optim/total_tokens": 1970215583744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2616583108901978, "created_at": "2025-06-03T07:41:40.911764+00:00"} {"global_step": 234869, "acc_step": 0, "speed/wps": 5517.081990351544, "speed/FLOPS": 243826784987985.6, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04814532399177551, "optim/lr": 1.4657134090429348e-05, "optim/total_tokens": 1970223972352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.266466736793518, "created_at": "2025-06-03T07:41:43.891179+00:00"} {"global_step": 234870, "acc_step": 0, "speed/wps": 5519.192990785116, "speed/FLOPS": 243920080402069.75, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04525207728147507, "optim/lr": 1.4653586865335022e-05, "optim/total_tokens": 1970232360960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2722711563110352, "created_at": "2025-06-03T07:41:46.864766+00:00"} {"global_step": 234871, "acc_step": 0, "speed/wps": 5514.086881827649, "speed/FLOPS": 243694416521584.6, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.41 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.41, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047171201556921005, "optim/lr": 1.4650039640240475e-05, "optim/total_tokens": 1970240749568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.265633225440979, "created_at": "2025-06-03T07:41:49.842866+00:00"} {"global_step": 234872, "acc_step": 0, "speed/wps": 5523.873886157126, "speed/FLOPS": 244126952018518.16, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04724757745862007, "optim/lr": 1.4646492415145929e-05, "optim/total_tokens": 1970249138176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2591841220855713, "created_at": "2025-06-03T07:41:52.814514+00:00"} {"global_step": 234873, "acc_step": 0, "speed/wps": 5531.307255829829, "speed/FLOPS": 244455468910616.53, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0470615029335022, "optim/lr": 1.4642945190051383e-05, "optim/total_tokens": 1970257526784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2570559978485107, "created_at": "2025-06-03T07:41:55.780996+00:00"} {"global_step": 234874, "acc_step": 0, "speed/wps": 5517.010389959251, "speed/FLOPS": 243823620617130.28, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04937854781746864, "optim/lr": 1.4639397964957058e-05, "optim/total_tokens": 1970265915392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2593951225280762, "created_at": "2025-06-03T07:41:58.760151+00:00"} {"global_step": 234875, "acc_step": 0, "speed/wps": 5527.921078478525, "speed/FLOPS": 244305817203715.75, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0466463603079319, "optim/lr": 1.463585073986251e-05, "optim/total_tokens": 1970274304000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2664217948913574, "created_at": "2025-06-03T07:42:01.728348+00:00"} {"global_step": 234876, "acc_step": 0, "speed/wps": 5526.254261530877, "speed/FLOPS": 244232152426172.25, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04667850211262703, "optim/lr": 1.4632303514767964e-05, "optim/total_tokens": 1970282692608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2635374069213867, "created_at": "2025-06-03T07:42:04.701340+00:00"} {"global_step": 234877, "acc_step": 0, "speed/wps": 5533.437179425576, "speed/FLOPS": 244549600631611.3, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046549782156944275, "optim/lr": 1.4628756289673417e-05, "optim/total_tokens": 1970291081216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2820155620574951, "created_at": "2025-06-03T07:42:07.670719+00:00"} {"global_step": 234878, "acc_step": 0, "speed/wps": 5522.472387345328, "speed/FLOPS": 244065012944557.88, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049101490527391434, "optim/lr": 1.4625209064579093e-05, "optim/total_tokens": 1970299469824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2730629444122314, "created_at": "2025-06-03T07:42:10.643445+00:00"} {"global_step": 234879, "acc_step": 0, "speed/wps": 5512.515255135063, "speed/FLOPS": 243624958666086.94, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045469172298908234, "optim/lr": 1.4621661839484546e-05, "optim/total_tokens": 1970307858432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2565813064575195, "created_at": "2025-06-03T07:42:13.621561+00:00"} {"global_step": 234880, "acc_step": 0, "speed/wps": 5521.806829164123, "speed/FLOPS": 244035598679584.22, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.44, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05229884386062622, "optim/lr": 1.4618114614389998e-05, "optim/total_tokens": 1970316247040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.268548846244812, "created_at": "2025-06-03T07:42:16.595334+00:00"} {"global_step": 234881, "acc_step": 0, "speed/wps": 5528.249082633894, "speed/FLOPS": 244320313308505.62, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045887235552072525, "optim/lr": 1.4614567389295452e-05, "optim/total_tokens": 1970324635648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2733781337738037, "created_at": "2025-06-03T07:42:19.563253+00:00"} {"global_step": 234882, "acc_step": 0, "speed/wps": 5529.860884745235, "speed/FLOPS": 244391546711875.8, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.26, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05047748237848282, "optim/lr": 1.4611020164201127e-05, "optim/total_tokens": 1970333024256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2725433111190796, "created_at": "2025-06-03T07:42:22.533025+00:00"} {"global_step": 234883, "acc_step": 0, "speed/wps": 5527.643561088668, "speed/FLOPS": 244293552355546.88, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046298179775476456, "optim/lr": 1.4607472939106581e-05, "optim/total_tokens": 1970341412864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2804839611053467, "created_at": "2025-06-03T07:42:25.501314+00:00"} {"global_step": 234884, "acc_step": 0, "speed/wps": 5530.01372983997, "speed/FLOPS": 244398301682731.0, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049398645758628845, "optim/lr": 1.4603925714012035e-05, "optim/total_tokens": 1970349801472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2660906314849854, "created_at": "2025-06-03T07:42:28.472939+00:00"} {"global_step": 234885, "acc_step": 0, "speed/wps": 5516.960619153048, "speed/FLOPS": 243821421002246.2, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04848955199122429, "optim/lr": 1.4600378488917487e-05, "optim/total_tokens": 1970358190080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2748658657073975, "created_at": "2025-06-03T07:42:31.448518+00:00"} {"global_step": 234886, "acc_step": 0, "speed/wps": 5506.16455670323, "speed/FLOPS": 243344290301221.22, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.4 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.4, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05023026838898659, "optim/lr": 1.4596831263823162e-05, "optim/total_tokens": 1970366578688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 359, "loss/out": 1.2763060331344604, "created_at": "2025-06-03T07:42:34.433853+00:00"} {"global_step": 234887, "acc_step": 0, "speed/wps": 5513.22035455687, "speed/FLOPS": 243656120451504.78, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.84, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04770520702004433, "optim/lr": 1.4593284038728616e-05, "optim/total_tokens": 1970374967296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2705414295196533, "created_at": "2025-06-03T07:42:37.414103+00:00"} {"global_step": 234888, "acc_step": 0, "speed/wps": 5521.4965032848095, "speed/FLOPS": 244021883864110.38, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04550798237323761, "optim/lr": 1.458973681363407e-05, "optim/total_tokens": 1970383355904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2729705572128296, "created_at": "2025-06-03T07:42:40.386009+00:00"} {"global_step": 234889, "acc_step": 0, "speed/wps": 5532.024268187909, "speed/FLOPS": 244487157186841.72, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.38 hours", "speed/est_time_elapsed_hrs": 193.18, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.38, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04695790633559227, "optim/lr": 1.4586189588539523e-05, "optim/total_tokens": 1970391744512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2566529512405396, "created_at": "2025-06-03T07:42:43.355036+00:00"} {"global_step": 234890, "acc_step": 0, "speed/wps": 5522.590388215737, "speed/FLOPS": 244070227979046.75, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.38 hours", "speed/est_time_elapsed_hrs": 193.44, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.38, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04745768383145332, "optim/lr": 1.4582642363445198e-05, "optim/total_tokens": 1970400133120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2802783250808716, "created_at": "2025-06-03T07:42:46.326215+00:00"} {"global_step": 234891, "acc_step": 0, "speed/wps": 5529.543571125344, "speed/FLOPS": 244377523074034.97, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.38 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.38, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04722922667860985, "optim/lr": 1.457909513835065e-05, "optim/total_tokens": 1970408521728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.272430181503296, "created_at": "2025-06-03T07:42:49.294177+00:00"} {"global_step": 234892, "acc_step": 0, "speed/wps": 5533.43841081863, "speed/FLOPS": 244549655052881.44, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.38 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.38, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04919213429093361, "optim/lr": 1.4575547913256104e-05, "optim/total_tokens": 1970416910336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2674345970153809, "created_at": "2025-06-03T07:42:52.259765+00:00"} {"global_step": 234893, "acc_step": 0, "speed/wps": 5533.649131997247, "speed/FLOPS": 244558967850407.56, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.38 hours", "speed/est_time_elapsed_hrs": 193.06, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.38, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.050390370190143585, "optim/lr": 1.457200068816178e-05, "optim/total_tokens": 1970425298944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2610342502593994, "created_at": "2025-06-03T07:42:55.225804+00:00"} {"global_step": 234894, "acc_step": 0, "speed/wps": 5538.459356177414, "speed/FLOPS": 244771555138211.62, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.37 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.37, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.052260417491197586, "optim/lr": 1.4568453463067233e-05, "optim/total_tokens": 1970433687552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2840911149978638, "created_at": "2025-06-03T07:42:58.188235+00:00"} {"global_step": 234895, "acc_step": 0, "speed/wps": 5511.904459645552, "speed/FLOPS": 243597964631785.28, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05411483719944954, "optim/lr": 1.4564906237972687e-05, "optim/total_tokens": 1970442076160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2478169202804565, "created_at": "2025-06-03T07:43:01.165398+00:00"} {"global_step": 234896, "acc_step": 0, "speed/wps": 5510.379461215709, "speed/FLOPS": 243530567506835.75, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.39 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.39, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04790322855114937, "optim/lr": 1.4561359012878139e-05, "optim/total_tokens": 1970450464768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.254644751548767, "created_at": "2025-06-03T07:43:04.144220+00:00"} {"global_step": 234897, "acc_step": 0, "speed/wps": 5526.655091513153, "speed/FLOPS": 244249867059755.03, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.38 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.38, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.057107049971818924, "optim/lr": 1.4557811787783814e-05, "optim/total_tokens": 1970458853376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2798616886138916, "created_at": "2025-06-03T07:43:07.116444+00:00"} {"global_step": 234898, "acc_step": 0, "speed/wps": 5531.612258655295, "speed/FLOPS": 244468948474356.12, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.37 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.37, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045520953834056854, "optim/lr": 1.4554264562689268e-05, "optim/total_tokens": 1970467241984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2570993900299072, "created_at": "2025-06-03T07:43:10.082986+00:00"} {"global_step": 234899, "acc_step": 0, "speed/wps": 5528.741655099346, "speed/FLOPS": 244342082490264.16, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.37 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.37, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05577072873711586, "optim/lr": 1.4550717337594721e-05, "optim/total_tokens": 1970475630592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2679334878921509, "created_at": "2025-06-03T07:43:13.052340+00:00"} {"global_step": 234900, "acc_step": 0, "speed/wps": 5523.683198205363, "speed/FLOPS": 244118524587079.62, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.38 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.38, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04811082035303116, "optim/lr": 1.4547170112500175e-05, "optim/total_tokens": 1970484019200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.26858651638031, "created_at": "2025-06-03T07:43:16.025954+00:00"} {"global_step": 234901, "acc_step": 0, "speed/wps": 249.9177643951383, "speed/FLOPS": 11045085991185.096, "speed/curr_iter_time": 2.8837, "speed/data_load_time": 0.002, "speed/curr_step_time": 2.8837, "speed/est_time_elapsed": "7.84 days", "speed/est_time_remaining": "3.28 hours", "speed/est_time_elapsed_hrs": 188.16, "speed/est_time_elapsed_days": 7.84, "speed/est_time_remaining_hrs": 3.28, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05296756327152252, "optim/lr": 1.454362288740585e-05, "optim/total_tokens": 1970492407808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2651357650756836, "created_at": "2025-06-03T07:44:21.590066+00:00"} {"global_step": 234902, "acc_step": 0, "speed/wps": 5621.734621654004, "speed/FLOPS": 248451895630828.47, "speed/curr_iter_time": 2.9119, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9119, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 190.0, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.055320095270872116, "optim/lr": 1.4540075662311302e-05, "optim/total_tokens": 1970500796416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2789413928985596, "created_at": "2025-06-03T07:44:24.511315+00:00"} {"global_step": 234903, "acc_step": 0, "speed/wps": 5575.493180550192, "speed/FLOPS": 246408260619191.6, "speed/curr_iter_time": 2.9375, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9375, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 191.67, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048899199813604355, "optim/lr": 1.4536528437216756e-05, "optim/total_tokens": 1970509185024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 356, "loss/out": 1.2705141305923462, "created_at": "2025-06-03T07:44:27.459042+00:00"} {"global_step": 234904, "acc_step": 0, "speed/wps": 5562.043500913724, "speed/FLOPS": 245813853620960.72, "speed/curr_iter_time": 2.9447, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9447, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 192.14, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05290971323847771, "optim/lr": 1.453298121212221e-05, "optim/total_tokens": 1970517573632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2638684511184692, "created_at": "2025-06-03T07:44:30.413610+00:00"} {"global_step": 234905, "acc_step": 0, "speed/wps": 5548.620838480152, "speed/FLOPS": 245220640644811.3, "speed/curr_iter_time": 2.9518, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9518, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04613516107201576, "optim/lr": 1.4529433987027885e-05, "optim/total_tokens": 1970525962240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2650738954544067, "created_at": "2025-06-03T07:44:33.372304+00:00"} {"global_step": 234906, "acc_step": 0, "speed/wps": 5560.308900283963, "speed/FLOPS": 245737193151616.2, "speed/curr_iter_time": 2.9448, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9448, "speed/est_time_elapsed": "8.01 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 192.15, "speed/est_time_elapsed_days": 8.01, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04888402670621872, "optim/lr": 1.4525886761933339e-05, "optim/total_tokens": 1970534350848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2667756080627441, "created_at": "2025-06-03T07:44:36.327276+00:00"} {"global_step": 234907, "acc_step": 0, "speed/wps": 5564.470967472501, "speed/FLOPS": 245921135217958.5, "speed/curr_iter_time": 2.9434, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9434, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 192.06, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04848071560263634, "optim/lr": 1.452233953683879e-05, "optim/total_tokens": 1970542739456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2730222940444946, "created_at": "2025-06-03T07:44:39.279205+00:00"} {"global_step": 234908, "acc_step": 0, "speed/wps": 5544.959786879316, "speed/FLOPS": 245058840903015.2, "speed/curr_iter_time": 2.9538, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9538, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0454525351524353, "optim/lr": 1.4518792311744244e-05, "optim/total_tokens": 1970551128064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2827850580215454, "created_at": "2025-06-03T07:44:42.245196+00:00"} {"global_step": 234909, "acc_step": 0, "speed/wps": 5532.269587729424, "speed/FLOPS": 244497999054917.44, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.13, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05475633963942528, "optim/lr": 1.451524508664992e-05, "optim/total_tokens": 1970559516672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.283191204071045, "created_at": "2025-06-03T07:44:45.212691+00:00"} {"global_step": 234910, "acc_step": 0, "speed/wps": 5550.717337573098, "speed/FLOPS": 245313295173864.4, "speed/curr_iter_time": 2.9507, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9507, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 192.54, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047985099256038666, "optim/lr": 1.4511697861555373e-05, "optim/total_tokens": 1970567905280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2776992321014404, "created_at": "2025-06-03T07:44:48.172883+00:00"} {"global_step": 234911, "acc_step": 0, "speed/wps": 5530.356578321996, "speed/FLOPS": 244413453830778.9, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05146561190485954, "optim/lr": 1.4508150636460827e-05, "optim/total_tokens": 1970576293888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2518439292907715, "created_at": "2025-06-03T07:44:51.145253+00:00"} {"global_step": 234912, "acc_step": 0, "speed/wps": 5533.598368649355, "speed/FLOPS": 244556724370261.1, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05429777875542641, "optim/lr": 1.4504603411366279e-05, "optim/total_tokens": 1970584682496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2555848360061646, "created_at": "2025-06-03T07:44:54.112679+00:00"} {"global_step": 234913, "acc_step": 0, "speed/wps": 5532.984159701006, "speed/FLOPS": 244529579478550.47, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04483005404472351, "optim/lr": 1.4501056186271954e-05, "optim/total_tokens": 1970593071104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2730755805969238, "created_at": "2025-06-03T07:44:57.078921+00:00"} {"global_step": 234914, "acc_step": 0, "speed/wps": 5528.093441886742, "speed/FLOPS": 244313434784123.06, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05453314259648323, "optim/lr": 1.4497508961177408e-05, "optim/total_tokens": 1970601459712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2697416543960571, "created_at": "2025-06-03T07:45:00.047594+00:00"} {"global_step": 234915, "acc_step": 0, "speed/wps": 5523.537345497161, "speed/FLOPS": 244112078643918.94, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04753350466489792, "optim/lr": 1.4493961736082862e-05, "optim/total_tokens": 1970609848320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2609421014785767, "created_at": "2025-06-03T07:45:03.018495+00:00"} {"global_step": 234916, "acc_step": 0, "speed/wps": 5537.663293848775, "speed/FLOPS": 244736373257902.16, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 192.92, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04786151275038719, "optim/lr": 1.4490414510988315e-05, "optim/total_tokens": 1970618236928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.261271357536316, "created_at": "2025-06-03T07:45:05.985826+00:00"} {"global_step": 234917, "acc_step": 0, "speed/wps": 5512.161659487651, "speed/FLOPS": 243609331548337.94, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.37 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.37, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05300317704677582, "optim/lr": 1.4486867285893989e-05, "optim/total_tokens": 1970626625536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2755175828933716, "created_at": "2025-06-03T07:45:08.962815+00:00"} {"global_step": 234918, "acc_step": 0, "speed/wps": 5543.555334960149, "speed/FLOPS": 244996771316824.56, "speed/curr_iter_time": 2.9546, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9546, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 192.8, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04647945240139961, "optim/lr": 1.4483320060799443e-05, "optim/total_tokens": 1970635014144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2652614116668701, "created_at": "2025-06-03T07:45:11.926855+00:00"} {"global_step": 234919, "acc_step": 0, "speed/wps": 5532.330133434, "speed/FLOPS": 244500674865158.72, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04777785763144493, "optim/lr": 1.4479772835704896e-05, "optim/total_tokens": 1970643402752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2679675817489624, "created_at": "2025-06-03T07:45:14.895840+00:00"} {"global_step": 234920, "acc_step": 0, "speed/wps": 5541.083495624469, "speed/FLOPS": 244887528670208.2, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045820243656635284, "optim/lr": 1.447622561061035e-05, "optim/total_tokens": 1970651791360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2668513059616089, "created_at": "2025-06-03T07:45:17.863260+00:00"} {"global_step": 234921, "acc_step": 0, "speed/wps": 5526.343415817046, "speed/FLOPS": 244236092589287.94, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04559849947690964, "optim/lr": 1.4472678385516025e-05, "optim/total_tokens": 1970660179968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2553471326828003, "created_at": "2025-06-03T07:45:20.832654+00:00"} {"global_step": 234922, "acc_step": 0, "speed/wps": 5528.844071035608, "speed/FLOPS": 244346608750434.66, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.044751521199941635, "optim/lr": 1.4469131160421479e-05, "optim/total_tokens": 1970668568576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2632575035095215, "created_at": "2025-06-03T07:45:23.805377+00:00"} {"global_step": 234923, "acc_step": 0, "speed/wps": 5525.056049752661, "speed/FLOPS": 244179197598579.0, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0454191118478775, "optim/lr": 1.4465583935326931e-05, "optim/total_tokens": 1970676957184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2703101634979248, "created_at": "2025-06-03T07:45:26.775901+00:00"} {"global_step": 234924, "acc_step": 0, "speed/wps": 5513.806958389, "speed/FLOPS": 243682045338374.34, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046135857701301575, "optim/lr": 1.4462036710232606e-05, "optim/total_tokens": 1970685345792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2635194063186646, "created_at": "2025-06-03T07:45:29.755725+00:00"} {"global_step": 234925, "acc_step": 0, "speed/wps": 5518.876465237814, "speed/FLOPS": 243906091593003.62, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04954329505562782, "optim/lr": 1.445848948513806e-05, "optim/total_tokens": 1970693734400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2780934572219849, "created_at": "2025-06-03T07:45:32.732069+00:00"} {"global_step": 234926, "acc_step": 0, "speed/wps": 5504.95842567662, "speed/FLOPS": 243290985483383.28, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.37 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.37, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049060553312301636, "optim/lr": 1.4454942260043514e-05, "optim/total_tokens": 1970702123008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2552860975265503, "created_at": "2025-06-03T07:45:35.716927+00:00"} {"global_step": 234927, "acc_step": 0, "speed/wps": 5515.34852031786, "speed/FLOPS": 243750174485200.7, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046184077858924866, "optim/lr": 1.4451395034948967e-05, "optim/total_tokens": 1970710511616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2774053812026978, "created_at": "2025-06-03T07:45:38.692299+00:00"} {"global_step": 234928, "acc_step": 0, "speed/wps": 5527.054600018523, "speed/FLOPS": 244267523290822.5, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04637168347835541, "optim/lr": 1.4447847809854641e-05, "optim/total_tokens": 1970718900224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2700132131576538, "created_at": "2025-06-03T07:45:41.662776+00:00"} {"global_step": 234929, "acc_step": 0, "speed/wps": 5525.251958257949, "speed/FLOPS": 244187855751762.06, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04756719991564751, "optim/lr": 1.4444300584760095e-05, "optim/total_tokens": 1970727288832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2686160802841187, "created_at": "2025-06-03T07:45:44.632330+00:00"} {"global_step": 234930, "acc_step": 0, "speed/wps": 5521.1599169456695, "speed/FLOPS": 244007008470725.47, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04777706041932106, "optim/lr": 1.4440753359665548e-05, "optim/total_tokens": 1970735677440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.271413803100586, "created_at": "2025-06-03T07:45:47.604315+00:00"} {"global_step": 234931, "acc_step": 0, "speed/wps": 5522.118989600646, "speed/FLOPS": 244049394573096.56, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045985471457242966, "optim/lr": 1.4437206134571002e-05, "optim/total_tokens": 1970744066048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2609996795654297, "created_at": "2025-06-03T07:45:50.576218+00:00"} {"global_step": 234932, "acc_step": 0, "speed/wps": 5522.176257330089, "speed/FLOPS": 244051925513615.16, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05161024630069733, "optim/lr": 1.4433658909476677e-05, "optim/total_tokens": 1970752454656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.278249740600586, "created_at": "2025-06-03T07:45:53.551243+00:00"} {"global_step": 234933, "acc_step": 0, "speed/wps": 5513.955389938716, "speed/FLOPS": 243688605253130.22, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04619832709431648, "optim/lr": 1.443011168438213e-05, "optim/total_tokens": 1970760843264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2646632194519043, "created_at": "2025-06-03T07:45:56.527223+00:00"} {"global_step": 234934, "acc_step": 0, "speed/wps": 5518.303345833879, "speed/FLOPS": 243880762648840.72, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046845026314258575, "optim/lr": 1.4426564459287583e-05, "optim/total_tokens": 1970769231872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2730637788772583, "created_at": "2025-06-03T07:45:59.501068+00:00"} {"global_step": 234935, "acc_step": 0, "speed/wps": 5511.5955479496015, "speed/FLOPS": 243584312315977.66, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.36 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.36, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0465116985142231, "optim/lr": 1.4423017234193037e-05, "optim/total_tokens": 1970777620480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2676053047180176, "created_at": "2025-06-03T07:46:02.478033+00:00"} {"global_step": 234936, "acc_step": 0, "speed/wps": 5512.208278041645, "speed/FLOPS": 243611391849809.06, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.84, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04766222834587097, "optim/lr": 1.4419470009098712e-05, "optim/total_tokens": 1970786009088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2743728160858154, "created_at": "2025-06-03T07:46:05.458069+00:00"} {"global_step": 234937, "acc_step": 0, "speed/wps": 5525.3819269378255, "speed/FLOPS": 244193599702172.6, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04949837923049927, "optim/lr": 1.4415922784004166e-05, "optim/total_tokens": 1970794397696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.253528356552124, "created_at": "2025-06-03T07:46:08.427948+00:00"} {"global_step": 234938, "acc_step": 0, "speed/wps": 5536.391327540302, "speed/FLOPS": 244680158857581.4, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04726458340883255, "optim/lr": 1.4412375558909618e-05, "optim/total_tokens": 1970802786304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2825337648391724, "created_at": "2025-06-03T07:46:11.396206+00:00"} {"global_step": 234939, "acc_step": 0, "speed/wps": 5518.812291392025, "speed/FLOPS": 243903255437491.25, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04884079471230507, "optim/lr": 1.4408828333815071e-05, "optim/total_tokens": 1970811174912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2711906433105469, "created_at": "2025-06-03T07:46:14.373208+00:00"} {"global_step": 234940, "acc_step": 0, "speed/wps": 5516.589975636122, "speed/FLOPS": 243805040455923.56, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0459064245223999, "optim/lr": 1.4405281108720747e-05, "optim/total_tokens": 1970819563520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2656407356262207, "created_at": "2025-06-03T07:46:17.352499+00:00"} {"global_step": 234941, "acc_step": 0, "speed/wps": 5520.31341244686, "speed/FLOPS": 243969597304680.88, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.35 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.35, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048925142735242844, "optim/lr": 1.44017338836262e-05, "optim/total_tokens": 1970827952128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.270387887954712, "created_at": "2025-06-03T07:46:20.329649+00:00"} {"global_step": 234942, "acc_step": 0, "speed/wps": 5529.489839830996, "speed/FLOPS": 244375148425846.5, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.31, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04633669555187225, "optim/lr": 1.4398186658531654e-05, "optim/total_tokens": 1970836340736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2582319974899292, "created_at": "2025-06-03T07:46:23.301304+00:00"} {"global_step": 234943, "acc_step": 0, "speed/wps": 5531.87407513167, "speed/FLOPS": 244480519422513.72, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049226973205804825, "optim/lr": 1.4394639433437106e-05, "optim/total_tokens": 1970844729344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.284143328666687, "created_at": "2025-06-03T07:46:26.271877+00:00"} {"global_step": 234944, "acc_step": 0, "speed/wps": 5524.680958372845, "speed/FLOPS": 244162620479482.84, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04638592153787613, "optim/lr": 1.4391092208342781e-05, "optim/total_tokens": 1970853117952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2727378606796265, "created_at": "2025-06-03T07:46:29.242675+00:00"} {"global_step": 234945, "acc_step": 0, "speed/wps": 5523.426862192458, "speed/FLOPS": 244107195847355.9, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045996394008398056, "optim/lr": 1.4387544983248235e-05, "optim/total_tokens": 1970861506560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2696367502212524, "created_at": "2025-06-03T07:46:32.214027+00:00"} {"global_step": 234946, "acc_step": 0, "speed/wps": 5525.91795627023, "speed/FLOPS": 244217289455018.06, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04729046672582626, "optim/lr": 1.4383997758153689e-05, "optim/total_tokens": 1970869895168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2810343503952026, "created_at": "2025-06-03T07:46:35.184251+00:00"} {"global_step": 234947, "acc_step": 0, "speed/wps": 5515.043969684649, "speed/FLOPS": 243736714906044.22, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045260779559612274, "optim/lr": 1.4380450533059142e-05, "optim/total_tokens": 1970878283776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2723888158798218, "created_at": "2025-06-03T07:46:38.163988+00:00"} {"global_step": 234948, "acc_step": 0, "speed/wps": 5523.472485282815, "speed/FLOPS": 244109212154429.5, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04672975093126297, "optim/lr": 1.4376903307964818e-05, "optim/total_tokens": 1970886672384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2484503984451294, "created_at": "2025-06-03T07:46:41.137887+00:00"} {"global_step": 234949, "acc_step": 0, "speed/wps": 5510.405961631381, "speed/FLOPS": 243531738689567.03, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.051680371165275574, "optim/lr": 1.437335608287027e-05, "optim/total_tokens": 1970895060992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2484800815582275, "created_at": "2025-06-03T07:46:44.118182+00:00"} {"global_step": 234950, "acc_step": 0, "speed/wps": 5517.208123021236, "speed/FLOPS": 243832359406380.44, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04588894546031952, "optim/lr": 1.4369808857775723e-05, "optim/total_tokens": 1970903449600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.282423496246338, "created_at": "2025-06-03T07:46:47.097198+00:00"} {"global_step": 234951, "acc_step": 0, "speed/wps": 5509.674458385673, "speed/FLOPS": 243499409990279.75, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04648489132523537, "optim/lr": 1.4366261632681399e-05, "optim/total_tokens": 1970911838208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2640677690505981, "created_at": "2025-06-03T07:46:50.078136+00:00"} {"global_step": 234952, "acc_step": 0, "speed/wps": 5522.953732523719, "speed/FLOPS": 244086285937694.78, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04572364315390587, "optim/lr": 1.4362714407586852e-05, "optim/total_tokens": 1970920226816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2622665166854858, "created_at": "2025-06-03T07:46:53.048867+00:00"} {"global_step": 234953, "acc_step": 0, "speed/wps": 5538.947785570328, "speed/FLOPS": 244793141217370.2, "speed/curr_iter_time": 2.9557, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9557, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04644204303622246, "optim/lr": 1.4359167182492306e-05, "optim/total_tokens": 1970928615424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2760593891143799, "created_at": "2025-06-03T07:46:56.015068+00:00"} {"global_step": 234954, "acc_step": 0, "speed/wps": 5535.535193572217, "speed/FLOPS": 244642322118282.97, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04597436264157295, "optim/lr": 1.4355619957397758e-05, "optim/total_tokens": 1970937004032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.281150221824646, "created_at": "2025-06-03T07:46:58.982188+00:00"} {"global_step": 234955, "acc_step": 0, "speed/wps": 5524.43284908734, "speed/FLOPS": 244151655319001.97, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0469406396150589, "optim/lr": 1.4352072732303433e-05, "optim/total_tokens": 1970945392640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2569507360458374, "created_at": "2025-06-03T07:47:01.958273+00:00"} {"global_step": 234956, "acc_step": 0, "speed/wps": 5523.87174408303, "speed/FLOPS": 244126857349807.22, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04579197242856026, "optim/lr": 1.4348525507208887e-05, "optim/total_tokens": 1970953781248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2705843448638916, "created_at": "2025-06-03T07:47:04.929647+00:00"} {"global_step": 234957, "acc_step": 0, "speed/wps": 5505.204378745094, "speed/FLOPS": 243301855350107.9, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04786960408091545, "optim/lr": 1.434497828211434e-05, "optim/total_tokens": 1970962169856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.271783471107483, "created_at": "2025-06-03T07:47:07.910744+00:00"} {"global_step": 234958, "acc_step": 0, "speed/wps": 5513.371098831054, "speed/FLOPS": 243662782576844.6, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046390727162361145, "optim/lr": 1.4341431057019794e-05, "optim/total_tokens": 1970970558464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2657694816589355, "created_at": "2025-06-03T07:47:10.890761+00:00"} {"global_step": 234959, "acc_step": 0, "speed/wps": 5506.229382034238, "speed/FLOPS": 243347155249045.66, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.34 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.34, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04647209495306015, "optim/lr": 1.433788383192547e-05, "optim/total_tokens": 1970978947072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2799066305160522, "created_at": "2025-06-03T07:47:13.871185+00:00"} {"global_step": 234960, "acc_step": 0, "speed/wps": 5512.893077046377, "speed/FLOPS": 243641656460699.12, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04798088222742081, "optim/lr": 1.4334336606830922e-05, "optim/total_tokens": 1970987335680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2890291213989258, "created_at": "2025-06-03T07:47:16.850806+00:00"} {"global_step": 234961, "acc_step": 0, "speed/wps": 5519.226516542501, "speed/FLOPS": 243921562068945.75, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04535454139113426, "optim/lr": 1.4330789381736375e-05, "optim/total_tokens": 1970995724288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2665705680847168, "created_at": "2025-06-03T07:47:19.827699+00:00"} {"global_step": 234962, "acc_step": 0, "speed/wps": 5524.800888900662, "speed/FLOPS": 244167920794952.28, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.050771500915288925, "optim/lr": 1.4327242156641829e-05, "optim/total_tokens": 1971004112896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2675025463104248, "created_at": "2025-06-03T07:47:22.801458+00:00"} {"global_step": 234963, "acc_step": 0, "speed/wps": 5522.867888242273, "speed/FLOPS": 244082492059845.72, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045825473964214325, "optim/lr": 1.4323694931547504e-05, "optim/total_tokens": 1971012501504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2665287256240845, "created_at": "2025-06-03T07:47:25.776309+00:00"} {"global_step": 234964, "acc_step": 0, "speed/wps": 5520.101604627969, "speed/FLOPS": 243960236483216.6, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04712928831577301, "optim/lr": 1.4320147706452958e-05, "optim/total_tokens": 1971020890112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2659912109375, "created_at": "2025-06-03T07:47:28.751819+00:00"} {"global_step": 234965, "acc_step": 0, "speed/wps": 5520.942505796637, "speed/FLOPS": 243997400010749.38, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046019356697797775, "optim/lr": 1.431660048135841e-05, "optim/total_tokens": 1971029278720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2586863040924072, "created_at": "2025-06-03T07:47:31.724948+00:00"} {"global_step": 234966, "acc_step": 0, "speed/wps": 5518.088208044161, "speed/FLOPS": 243871254659710.2, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046514373272657394, "optim/lr": 1.4313053256263864e-05, "optim/total_tokens": 1971037667328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2883505821228027, "created_at": "2025-06-03T07:47:34.698816+00:00"} {"global_step": 234967, "acc_step": 0, "speed/wps": 5507.510372767256, "speed/FLOPS": 243403768482740.06, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04856071621179581, "optim/lr": 1.4309506031169539e-05, "optim/total_tokens": 1971046055936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2538259029388428, "created_at": "2025-06-03T07:47:37.682001+00:00"} {"global_step": 234968, "acc_step": 0, "speed/wps": 5503.004876391375, "speed/FLOPS": 243204648604147.12, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04642574116587639, "optim/lr": 1.4305958806074993e-05, "optim/total_tokens": 1971054444544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2765884399414062, "created_at": "2025-06-03T07:47:40.663573+00:00"} {"global_step": 234969, "acc_step": 0, "speed/wps": 5504.989178405809, "speed/FLOPS": 243292344596606.7, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045867450535297394, "optim/lr": 1.4302411580980446e-05, "optim/total_tokens": 1971062833152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.264649748802185, "created_at": "2025-06-03T07:47:43.647137+00:00"} {"global_step": 234970, "acc_step": 0, "speed/wps": 5515.431303366978, "speed/FLOPS": 243753833072249.66, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045262232422828674, "optim/lr": 1.4298864355885898e-05, "optim/total_tokens": 1971071221760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2701373100280762, "created_at": "2025-06-03T07:47:46.626031+00:00"} {"global_step": 234971, "acc_step": 0, "speed/wps": 5519.213611716135, "speed/FLOPS": 243920991741673.3, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047036636620759964, "optim/lr": 1.4295317130791574e-05, "optim/total_tokens": 1971079610368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2795686721801758, "created_at": "2025-06-03T07:47:49.603121+00:00"} {"global_step": 234972, "acc_step": 0, "speed/wps": 5512.440196848016, "speed/FLOPS": 243621641473982.6, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04607759788632393, "optim/lr": 1.4291769905697027e-05, "optim/total_tokens": 1971087998976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.276139259338379, "created_at": "2025-06-03T07:47:52.582246+00:00"} {"global_step": 234973, "acc_step": 0, "speed/wps": 5527.780925237841, "speed/FLOPS": 244299623147846.84, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0457950234413147, "optim/lr": 1.4288222680602481e-05, "optim/total_tokens": 1971096387584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2532204389572144, "created_at": "2025-06-03T07:47:55.554315+00:00"} {"global_step": 234974, "acc_step": 0, "speed/wps": 5529.730055638465, "speed/FLOPS": 244385764735000.66, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04513523355126381, "optim/lr": 1.4284675455507935e-05, "optim/total_tokens": 1971104776192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2509865760803223, "created_at": "2025-06-03T07:47:58.525694+00:00"} {"global_step": 234975, "acc_step": 0, "speed/wps": 5510.1705831383015, "speed/FLOPS": 243521336164949.28, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047550883144140244, "optim/lr": 1.4281128230413608e-05, "optim/total_tokens": 1971113164800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2728664875030518, "created_at": "2025-06-03T07:48:01.504576+00:00"} {"global_step": 234976, "acc_step": 0, "speed/wps": 5499.586868590298, "speed/FLOPS": 243053590154289.4, "speed/curr_iter_time": 2.9783, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9783, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04557674005627632, "optim/lr": 1.4277581005319062e-05, "optim/total_tokens": 1971121553408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.278376817703247, "created_at": "2025-06-03T07:48:04.493615+00:00"} {"global_step": 234977, "acc_step": 0, "speed/wps": 5498.421454623874, "speed/FLOPS": 243002084822102.9, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.33 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.33, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046921443194150925, "optim/lr": 1.4274033780224516e-05, "optim/total_tokens": 1971129942016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2793428897857666, "created_at": "2025-06-03T07:48:07.478316+00:00"} {"global_step": 234978, "acc_step": 0, "speed/wps": 5513.337239851551, "speed/FLOPS": 243661286183256.53, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04727117344737053, "optim/lr": 1.4270486555130191e-05, "optim/total_tokens": 1971138330624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.264628529548645, "created_at": "2025-06-03T07:48:10.454561+00:00"} {"global_step": 234979, "acc_step": 0, "speed/wps": 5512.443274036099, "speed/FLOPS": 243621777469945.38, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04682743176817894, "optim/lr": 1.4266939330035645e-05, "optim/total_tokens": 1971146719232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2673039436340332, "created_at": "2025-06-03T07:48:13.434161+00:00"} {"global_step": 234980, "acc_step": 0, "speed/wps": 5530.1840324720715, "speed/FLOPS": 244405828187381.97, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 193.23, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04518584534525871, "optim/lr": 1.4263392104941098e-05, "optim/total_tokens": 1971155107840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2683467864990234, "created_at": "2025-06-03T07:48:16.401985+00:00"} {"global_step": 234981, "acc_step": 0, "speed/wps": 5512.420904692965, "speed/FLOPS": 243620788859475.56, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04661345109343529, "optim/lr": 1.425984487984655e-05, "optim/total_tokens": 1971163496448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.265083909034729, "created_at": "2025-06-03T07:48:19.381357+00:00"} {"global_step": 234982, "acc_step": 0, "speed/wps": 5526.687719632144, "speed/FLOPS": 244251309055608.6, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04676947742700577, "optim/lr": 1.4256297654752226e-05, "optim/total_tokens": 1971171885056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2585724592208862, "created_at": "2025-06-03T07:48:22.355251+00:00"} {"global_step": 234983, "acc_step": 0, "speed/wps": 5516.82099647754, "speed/FLOPS": 243815250394642.34, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0502665750682354, "optim/lr": 1.425275042965768e-05, "optim/total_tokens": 1971180273664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.25748610496521, "created_at": "2025-06-03T07:48:25.329493+00:00"} {"global_step": 234984, "acc_step": 0, "speed/wps": 5506.948885408592, "speed/FLOPS": 243378953615439.97, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04604216292500496, "optim/lr": 1.4249203204563133e-05, "optim/total_tokens": 1971188662272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.274845838546753, "created_at": "2025-06-03T07:48:28.312358+00:00"} {"global_step": 234985, "acc_step": 0, "speed/wps": 5508.621354908272, "speed/FLOPS": 243452868206850.9, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.32 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.32, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04717453941702843, "optim/lr": 1.4245655979468587e-05, "optim/total_tokens": 1971197050880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2687581777572632, "created_at": "2025-06-03T07:48:31.294692+00:00"} {"global_step": 234986, "acc_step": 0, "speed/wps": 5530.056163273038, "speed/FLOPS": 244400177023278.6, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04679626226425171, "optim/lr": 1.424210875437426e-05, "optim/total_tokens": 1971205439488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2553647756576538, "created_at": "2025-06-03T07:48:34.266048+00:00"} {"global_step": 234987, "acc_step": 0, "speed/wps": 5525.250959570448, "speed/FLOPS": 244187811614886.25, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04971285164356232, "optim/lr": 1.4238561529279714e-05, "optim/total_tokens": 1971213828096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2800954580307007, "created_at": "2025-06-03T07:48:37.236015+00:00"} {"global_step": 234988, "acc_step": 0, "speed/wps": 5528.833859635619, "speed/FLOPS": 244346157458821.8, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04893997311592102, "optim/lr": 1.4235014304185168e-05, "optim/total_tokens": 1971222216704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2601938247680664, "created_at": "2025-06-03T07:48:40.204162+00:00"} {"global_step": 234989, "acc_step": 0, "speed/wps": 5519.693315646202, "speed/FLOPS": 243942192200034.94, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.056178782135248184, "optim/lr": 1.4231467079090621e-05, "optim/total_tokens": 1971230605312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2679258584976196, "created_at": "2025-06-03T07:48:43.177332+00:00"} {"global_step": 234990, "acc_step": 0, "speed/wps": 5521.99340447411, "speed/FLOPS": 244043844353306.62, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04640182480216026, "optim/lr": 1.4227919853996297e-05, "optim/total_tokens": 1971238993920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.270948886871338, "created_at": "2025-06-03T07:48:46.150912+00:00"} {"global_step": 234991, "acc_step": 0, "speed/wps": 5519.842211072689, "speed/FLOPS": 243948772615769.78, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05669911950826645, "optim/lr": 1.4224372628901749e-05, "optim/total_tokens": 1971247382528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2743226289749146, "created_at": "2025-06-03T07:48:49.123952+00:00"} {"global_step": 234992, "acc_step": 0, "speed/wps": 5510.969899150366, "speed/FLOPS": 243556661841412.28, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046575672924518585, "optim/lr": 1.4220825403807202e-05, "optim/total_tokens": 1971255771136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2642399072647095, "created_at": "2025-06-03T07:48:52.104038+00:00"} {"global_step": 234993, "acc_step": 0, "speed/wps": 5518.096189834374, "speed/FLOPS": 243871607413983.12, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05052398145198822, "optim/lr": 1.4217278178712656e-05, "optim/total_tokens": 1971264159744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2588437795639038, "created_at": "2025-06-03T07:48:55.082735+00:00"} {"global_step": 234994, "acc_step": 0, "speed/wps": 5510.301402243317, "speed/FLOPS": 243527117699798.1, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.31 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.31, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05176307633519173, "optim/lr": 1.4213730953618331e-05, "optim/total_tokens": 1971272548352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2530252933502197, "created_at": "2025-06-03T07:48:58.060509+00:00"} {"global_step": 234995, "acc_step": 0, "speed/wps": 5527.574341429841, "speed/FLOPS": 244290493200925.06, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0533478707075119, "optim/lr": 1.4210183728523785e-05, "optim/total_tokens": 1971280936960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2688654661178589, "created_at": "2025-06-03T07:49:01.035195+00:00"} {"global_step": 234996, "acc_step": 0, "speed/wps": 5519.96467556045, "speed/FLOPS": 243954184919298.75, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05251799523830414, "optim/lr": 1.4206636503429237e-05, "optim/total_tokens": 1971289325568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.266755223274231, "created_at": "2025-06-03T07:49:04.010129+00:00"} {"global_step": 234997, "acc_step": 0, "speed/wps": 5510.28750052802, "speed/FLOPS": 243526503315137.4, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0466315895318985, "optim/lr": 1.420308927833469e-05, "optim/total_tokens": 1971297714176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.274522066116333, "created_at": "2025-06-03T07:49:06.988059+00:00"} {"global_step": 234998, "acc_step": 0, "speed/wps": 5519.232486522342, "speed/FLOPS": 243921825911497.62, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05713250860571861, "optim/lr": 1.4199542053240366e-05, "optim/total_tokens": 1971306102784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2789392471313477, "created_at": "2025-06-03T07:49:09.960922+00:00"} {"global_step": 234999, "acc_step": 0, "speed/wps": 5513.910033241992, "speed/FLOPS": 243686600719291.66, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04760238528251648, "optim/lr": 1.419599482814582e-05, "optim/total_tokens": 1971314491392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2825361490249634, "created_at": "2025-06-03T07:49:12.939301+00:00"} {"global_step": 235000, "acc_step": 0, "speed/wps": 5513.536878756799, "speed/FLOPS": 243670109201023.9, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.3 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.3, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.06186554580926895, "optim/lr": 1.4192447603051273e-05, "optim/total_tokens": 1971322880000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2559627294540405, "created_at": "2025-06-03T07:49:15.919518+00:00"} {"global_step": 235001, "acc_step": 0, "speed/wps": 223.75133048379388, "speed/FLOPS": 9888663544253.656, "speed/curr_iter_time": 4.6701, "speed/data_load_time": 4.5197, "speed/curr_step_time": 4.6701, "speed/est_time_elapsed": "12.7 days", "speed/est_time_remaining": "5.19 hours", "speed/est_time_elapsed_hrs": 304.86, "speed/est_time_elapsed_days": 12.7, "speed/est_time_remaining_hrs": 5.19, "speed/est_time_remaining_days": 0.22, "optim/grad_norm": 0.05647760257124901, "optim/lr": 1.4188900377956727e-05, "optim/total_tokens": 1971331268608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2732744216918945, "created_at": "2025-06-03T07:50:29.150928+00:00"} {"global_step": 235002, "acc_step": 0, "speed/wps": 5629.311390467138, "speed/FLOPS": 248786750030950.62, "speed/curr_iter_time": 2.9071, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9071, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 189.77, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.055713802576065063, "optim/lr": 1.41853531528624e-05, "optim/total_tokens": 1971339657216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2715429067611694, "created_at": "2025-06-03T07:50:32.069770+00:00"} {"global_step": 235003, "acc_step": 0, "speed/wps": 5589.196713988863, "speed/FLOPS": 247013886656138.28, "speed/curr_iter_time": 2.9287, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9287, "speed/est_time_elapsed": "7.97 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 191.18, "speed/est_time_elapsed_days": 7.97, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.06730809062719345, "optim/lr": 1.4181805927767854e-05, "optim/total_tokens": 1971348045824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2690742015838623, "created_at": "2025-06-03T07:50:35.007689+00:00"} {"global_step": 235004, "acc_step": 0, "speed/wps": 5573.478695376429, "speed/FLOPS": 246319230685581.1, "speed/curr_iter_time": 2.9386, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9386, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 191.83, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04555041715502739, "optim/lr": 1.4178258702673308e-05, "optim/total_tokens": 1971356434432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2740648984909058, "created_at": "2025-06-03T07:50:37.955096+00:00"} {"global_step": 235005, "acc_step": 0, "speed/wps": 5555.999429773584, "speed/FLOPS": 245546736612927.1, "speed/curr_iter_time": 2.9478, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9478, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.43, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05434029549360275, "optim/lr": 1.4174711477578983e-05, "optim/total_tokens": 1971364823040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2781476974487305, "created_at": "2025-06-03T07:50:40.911779+00:00"} {"global_step": 235006, "acc_step": 0, "speed/wps": 5555.0510046251575, "speed/FLOPS": 245504821075846.62, "speed/curr_iter_time": 2.9484, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9484, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.47, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05910031124949455, "optim/lr": 1.4171164252484437e-05, "optim/total_tokens": 1971373211648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.259415626525879, "created_at": "2025-06-03T07:50:43.869945+00:00"} {"global_step": 235007, "acc_step": 0, "speed/wps": 5547.884625676334, "speed/FLOPS": 245188103807161.28, "speed/curr_iter_time": 2.9509, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9509, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.63, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04607207328081131, "optim/lr": 1.4167617027389889e-05, "optim/total_tokens": 1971381600256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2674885988235474, "created_at": "2025-06-03T07:50:46.832609+00:00"} {"global_step": 235008, "acc_step": 0, "speed/wps": 5537.653654278855, "speed/FLOPS": 244735947238251.5, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.28 hours", "speed/est_time_elapsed_hrs": 193.08, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.28, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.058184053748846054, "optim/lr": 1.4164069802295343e-05, "optim/total_tokens": 1971389988864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2737147808074951, "created_at": "2025-06-03T07:50:49.800366+00:00"} {"global_step": 235009, "acc_step": 0, "speed/wps": 5516.557144878702, "speed/FLOPS": 243803589504488.62, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.29 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.29, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05381510779261589, "optim/lr": 1.4160522577201018e-05, "optim/total_tokens": 1971398377472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2587734460830688, "created_at": "2025-06-03T07:50:52.775603+00:00"} {"global_step": 235010, "acc_step": 0, "speed/wps": 5537.657289159755, "speed/FLOPS": 244736107881382.28, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.28 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.28, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05132145807147026, "optim/lr": 1.4156975352106472e-05, "optim/total_tokens": 1971406766080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.272338628768921, "created_at": "2025-06-03T07:50:55.740107+00:00"} {"global_step": 235011, "acc_step": 0, "speed/wps": 5520.110403304769, "speed/FLOPS": 243960625339695.44, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.29 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.29, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05723699554800987, "optim/lr": 1.4153428127011925e-05, "optim/total_tokens": 1971415154688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2466940879821777, "created_at": "2025-06-03T07:50:58.716488+00:00"} {"global_step": 235012, "acc_step": 0, "speed/wps": 5540.798735664328, "speed/FLOPS": 244874943737503.56, "speed/curr_iter_time": 2.9561, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9561, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.98, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04722823575139046, "optim/lr": 1.4149880901917377e-05, "optim/total_tokens": 1971423543296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.28163743019104, "created_at": "2025-06-03T07:51:01.679014+00:00"} {"global_step": 235013, "acc_step": 0, "speed/wps": 5541.057010418291, "speed/FLOPS": 244886358159658.7, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05174832046031952, "optim/lr": 1.4146333676823053e-05, "optim/total_tokens": 1971431931904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2567260265350342, "created_at": "2025-06-03T07:51:04.641175+00:00"} {"global_step": 235014, "acc_step": 0, "speed/wps": 5540.501174026066, "speed/FLOPS": 244861793036150.9, "speed/curr_iter_time": 2.9547, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9547, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05198254808783531, "optim/lr": 1.4142786451728506e-05, "optim/total_tokens": 1971440320512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.277115821838379, "created_at": "2025-06-03T07:51:07.603288+00:00"} {"global_step": 235015, "acc_step": 0, "speed/wps": 5535.596208787595, "speed/FLOPS": 244645018678498.5, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.28 hours", "speed/est_time_elapsed_hrs": 193.16, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.28, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046911127865314484, "optim/lr": 1.413923922663396e-05, "optim/total_tokens": 1971448709120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.267337679862976, "created_at": "2025-06-03T07:51:10.568423+00:00"} {"global_step": 235016, "acc_step": 0, "speed/wps": 5541.342489002162, "speed/FLOPS": 244898974851853.94, "speed/curr_iter_time": 2.9558, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9558, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05111865699291229, "optim/lr": 1.4135692001539414e-05, "optim/total_tokens": 1971457097728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2847070693969727, "created_at": "2025-06-03T07:51:13.533522+00:00"} {"global_step": 235017, "acc_step": 0, "speed/wps": 5535.058211015655, "speed/FLOPS": 244621241930700.94, "speed/curr_iter_time": 2.958, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.958, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.11, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046936482191085815, "optim/lr": 1.4132144776445089e-05, "optim/total_tokens": 1971465486336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2703523635864258, "created_at": "2025-06-03T07:51:16.502641+00:00"} {"global_step": 235018, "acc_step": 0, "speed/wps": 5541.607005750356, "speed/FLOPS": 244910665138204.66, "speed/curr_iter_time": 2.9557, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9557, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04944337159395218, "optim/lr": 1.4128597551350541e-05, "optim/total_tokens": 1971473874944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2610702514648438, "created_at": "2025-06-03T07:51:19.464840+00:00"} {"global_step": 235019, "acc_step": 0, "speed/wps": 5505.519349112083, "speed/FLOPS": 243315775428164.3, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.29 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.29, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047580115497112274, "optim/lr": 1.4125050326255995e-05, "optim/total_tokens": 1971482263552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2898266315460205, "created_at": "2025-06-03T07:51:22.449498+00:00"} {"global_step": 235020, "acc_step": 0, "speed/wps": 5516.564875731369, "speed/FLOPS": 243803931168606.44, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.28 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.28, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04577269405126572, "optim/lr": 1.4121503101161448e-05, "optim/total_tokens": 1971490652160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2707711458206177, "created_at": "2025-06-03T07:51:25.428429+00:00"} {"global_step": 235021, "acc_step": 0, "speed/wps": 5534.452787511245, "speed/FLOPS": 244594485310644.47, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.21, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049381323158741, "optim/lr": 1.4117955876067124e-05, "optim/total_tokens": 1971499040768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2968990802764893, "created_at": "2025-06-03T07:51:28.395153+00:00"} {"global_step": 235022, "acc_step": 0, "speed/wps": 5543.78411084158, "speed/FLOPS": 245006882039802.72, "speed/curr_iter_time": 2.9545, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9545, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 192.88, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04796351119875908, "optim/lr": 1.4114408650972577e-05, "optim/total_tokens": 1971507429376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2719581127166748, "created_at": "2025-06-03T07:51:31.358758+00:00"} {"global_step": 235023, "acc_step": 0, "speed/wps": 5536.466661394999, "speed/FLOPS": 244683488228365.44, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.14, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04642985761165619, "optim/lr": 1.411086142587803e-05, "optim/total_tokens": 1971515817984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2710106372833252, "created_at": "2025-06-03T07:51:34.323542+00:00"} {"global_step": 235024, "acc_step": 0, "speed/wps": 5535.28252108309, "speed/FLOPS": 244631155287558.56, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.1, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04859232157468796, "optim/lr": 1.4107314200783483e-05, "optim/total_tokens": 1971524206592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2681233882904053, "created_at": "2025-06-03T07:51:37.288666+00:00"} {"global_step": 235025, "acc_step": 0, "speed/wps": 5520.601510419737, "speed/FLOPS": 243982329760462.94, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.28 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.28, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04744012653827667, "optim/lr": 1.4103766975689158e-05, "optim/total_tokens": 1971532595200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2646610736846924, "created_at": "2025-06-03T07:51:40.261785+00:00"} {"global_step": 235026, "acc_step": 0, "speed/wps": 5525.816050089678, "speed/FLOPS": 244212785723440.78, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048382796347141266, "optim/lr": 1.4100219750594612e-05, "optim/total_tokens": 1971540983808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2527055740356445, "created_at": "2025-06-03T07:51:43.231943+00:00"} {"global_step": 235027, "acc_step": 0, "speed/wps": 5524.296385511802, "speed/FLOPS": 244145624327447.1, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047516245394945145, "optim/lr": 1.4096672525500066e-05, "optim/total_tokens": 1971549372416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2698129415512085, "created_at": "2025-06-03T07:51:46.203078+00:00"} {"global_step": 235028, "acc_step": 0, "speed/wps": 5530.834561872517, "speed/FLOPS": 244434578257170.34, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047826919704675674, "optim/lr": 1.4093125300405518e-05, "optim/total_tokens": 1971557761024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2629497051239014, "created_at": "2025-06-03T07:51:49.173680+00:00"} {"global_step": 235029, "acc_step": 0, "speed/wps": 5529.298659682698, "speed/FLOPS": 244366699241840.4, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.27 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.27, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05088066682219505, "optim/lr": 1.4089578075311193e-05, "optim/total_tokens": 1971566149632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.269534945487976, "created_at": "2025-06-03T07:51:52.144979+00:00"} {"global_step": 235030, "acc_step": 0, "speed/wps": 5542.5481601690435, "speed/FLOPS": 244952259346245.62, "speed/curr_iter_time": 2.9538, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9538, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 192.84, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046587008982896805, "optim/lr": 1.4086030850216647e-05, "optim/total_tokens": 1971574538240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.264702320098877, "created_at": "2025-06-03T07:51:55.106495+00:00"} {"global_step": 235031, "acc_step": 0, "speed/wps": 5542.716633681852, "speed/FLOPS": 244959705013186.16, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04650720953941345, "optim/lr": 1.40824836251221e-05, "optim/total_tokens": 1971582926848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2780543565750122, "created_at": "2025-06-03T07:51:58.069860+00:00"} {"global_step": 235032, "acc_step": 0, "speed/wps": 5543.573737269784, "speed/FLOPS": 244997584604718.9, "speed/curr_iter_time": 2.9546, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9546, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 192.9, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04719754308462143, "optim/lr": 1.4078936400027776e-05, "optim/total_tokens": 1971591315456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2659283876419067, "created_at": "2025-06-03T07:52:01.034776+00:00"} {"global_step": 235033, "acc_step": 0, "speed/wps": 5533.765516939913, "speed/FLOPS": 244564111469161.25, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045974694192409515, "optim/lr": 1.407538917493323e-05, "optim/total_tokens": 1971599704064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2619857788085938, "created_at": "2025-06-03T07:52:04.003759+00:00"} {"global_step": 235034, "acc_step": 0, "speed/wps": 5533.486836764044, "speed/FLOPS": 244551795231802.28, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04961167275905609, "optim/lr": 1.4071841949838681e-05, "optim/total_tokens": 1971608092672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2639411687850952, "created_at": "2025-06-03T07:52:06.970042+00:00"} {"global_step": 235035, "acc_step": 0, "speed/wps": 5526.089130696897, "speed/FLOPS": 244224854488526.6, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04668813943862915, "optim/lr": 1.4068294724744135e-05, "optim/total_tokens": 1971616481280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2646690607070923, "created_at": "2025-06-03T07:52:09.941678+00:00"} {"global_step": 235036, "acc_step": 0, "speed/wps": 5527.660977324273, "speed/FLOPS": 244294322064016.22, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.046795569360256195, "optim/lr": 1.406474749964981e-05, "optim/total_tokens": 1971624869888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2701643705368042, "created_at": "2025-06-03T07:52:12.910764+00:00"} {"global_step": 235037, "acc_step": 0, "speed/wps": 5523.502471003454, "speed/FLOPS": 244110537369800.94, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.047006756067276, "optim/lr": 1.4061200274555264e-05, "optim/total_tokens": 1971633258496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.266767978668213, "created_at": "2025-06-03T07:52:15.885463+00:00"} {"global_step": 235038, "acc_step": 0, "speed/wps": 5524.018465689395, "speed/FLOPS": 244133341693819.3, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04654063656926155, "optim/lr": 1.4057653049460718e-05, "optim/total_tokens": 1971641647104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2629365921020508, "created_at": "2025-06-03T07:52:18.855649+00:00"} {"global_step": 235039, "acc_step": 0, "speed/wps": 5528.921210526042, "speed/FLOPS": 244350017921076.16, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04642612114548683, "optim/lr": 1.405410582436617e-05, "optim/total_tokens": 1971650035712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2740274667739868, "created_at": "2025-06-03T07:52:21.823712+00:00"} {"global_step": 235040, "acc_step": 0, "speed/wps": 5536.493566217665, "speed/FLOPS": 244684677283815.88, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.07, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05118861049413681, "optim/lr": 1.4050558599271845e-05, "optim/total_tokens": 1971658424320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2667454481124878, "created_at": "2025-06-03T07:52:24.788214+00:00"} {"global_step": 235041, "acc_step": 0, "speed/wps": 5526.181770160529, "speed/FLOPS": 244228948678647.34, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048817891627550125, "optim/lr": 1.4047011374177299e-05, "optim/total_tokens": 1971666812928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2929062843322754, "created_at": "2025-06-03T07:52:27.762209+00:00"} {"global_step": 235042, "acc_step": 0, "speed/wps": 5531.57288426701, "speed/FLOPS": 244467208327930.3, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04802853986620903, "optim/lr": 1.4043464149082752e-05, "optim/total_tokens": 1971675201536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2743537425994873, "created_at": "2025-06-03T07:52:30.732848+00:00"} {"global_step": 235043, "acc_step": 0, "speed/wps": 5525.68862708955, "speed/FLOPS": 244207154279045.16, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04624439403414726, "optim/lr": 1.4039916923988206e-05, "optim/total_tokens": 1971683590144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2603527307510376, "created_at": "2025-06-03T07:52:33.703270+00:00"} {"global_step": 235044, "acc_step": 0, "speed/wps": 5532.508373077552, "speed/FLOPS": 244508552145090.5, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.19, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049235373735427856, "optim/lr": 1.403636969889388e-05, "optim/total_tokens": 1971691978752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2785372734069824, "created_at": "2025-06-03T07:52:36.669412+00:00"} {"global_step": 235045, "acc_step": 0, "speed/wps": 5530.561874452506, "speed/FLOPS": 244422526868946.62, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.36, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04829123988747597, "optim/lr": 1.4032822473799333e-05, "optim/total_tokens": 1971700367360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2586748600006104, "created_at": "2025-06-03T07:52:39.641113+00:00"} {"global_step": 235046, "acc_step": 0, "speed/wps": 5533.530334334628, "speed/FLOPS": 244553717601781.34, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04892617091536522, "optim/lr": 1.4029275248704787e-05, "optim/total_tokens": 1971708755968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2834795713424683, "created_at": "2025-06-03T07:52:42.608025+00:00"} {"global_step": 235047, "acc_step": 0, "speed/wps": 5532.993276186263, "speed/FLOPS": 244529982380536.4, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04893475025892258, "optim/lr": 1.402572802361024e-05, "optim/total_tokens": 1971717144576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2660315036773682, "created_at": "2025-06-03T07:52:45.576310+00:00"} {"global_step": 235048, "acc_step": 0, "speed/wps": 5531.428483840102, "speed/FLOPS": 244460826568169.38, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04761438071727753, "optim/lr": 1.4022180798515916e-05, "optim/total_tokens": 1971725533184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.270041584968567, "created_at": "2025-06-03T07:52:48.543341+00:00"} {"global_step": 235049, "acc_step": 0, "speed/wps": 5542.074049410901, "speed/FLOPS": 244931306077454.6, "speed/curr_iter_time": 2.9554, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9554, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 192.96, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04573072865605354, "optim/lr": 1.4018633573421368e-05, "optim/total_tokens": 1971733921792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2750589847564697, "created_at": "2025-06-03T07:52:51.509338+00:00"} {"global_step": 235050, "acc_step": 0, "speed/wps": 5532.866818360701, "speed/FLOPS": 244524393591916.4, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04686397314071655, "optim/lr": 1.4015086348326822e-05, "optim/total_tokens": 1971742310400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2604706287384033, "created_at": "2025-06-03T07:52:54.477502+00:00"} {"global_step": 235051, "acc_step": 0, "speed/wps": 5529.28042284349, "speed/FLOPS": 244365893266892.03, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.34, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0541250966489315, "optim/lr": 1.4011539123232275e-05, "optim/total_tokens": 1971750699008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2772212028503418, "created_at": "2025-06-03T07:52:57.444991+00:00"} {"global_step": 235052, "acc_step": 0, "speed/wps": 5531.791141301018, "speed/FLOPS": 244476854171692.72, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.32, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.050656188279390335, "optim/lr": 1.400799189813795e-05, "optim/total_tokens": 1971759087616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2553610801696777, "created_at": "2025-06-03T07:53:00.411855+00:00"} {"global_step": 235053, "acc_step": 0, "speed/wps": 5519.937313684358, "speed/FLOPS": 243952975664426.28, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.048808544874191284, "optim/lr": 1.4004444673043404e-05, "optim/total_tokens": 1971767476224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2683581113815308, "created_at": "2025-06-03T07:53:03.388073+00:00"} {"global_step": 235054, "acc_step": 0, "speed/wps": 5530.478761764597, "speed/FLOPS": 244418853713550.34, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04552518576383591, "optim/lr": 1.4000897447948856e-05, "optim/total_tokens": 1971775864832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.264451503753662, "created_at": "2025-06-03T07:53:06.360080+00:00"} {"global_step": 235055, "acc_step": 0, "speed/wps": 5528.57045617089, "speed/FLOPS": 244334516373901.97, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.44, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0462830625474453, "optim/lr": 1.399735022285431e-05, "optim/total_tokens": 1971784253440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2754648923873901, "created_at": "2025-06-03T07:53:09.331794+00:00"} {"global_step": 235056, "acc_step": 0, "speed/wps": 5528.16914507131, "speed/FLOPS": 244316780477396.94, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04530069977045059, "optim/lr": 1.3993802997759985e-05, "optim/total_tokens": 1971792642048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2654668092727661, "created_at": "2025-06-03T07:53:12.300207+00:00"} {"global_step": 235057, "acc_step": 0, "speed/wps": 5521.543016019372, "speed/FLOPS": 244023939488904.28, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04876893386244774, "optim/lr": 1.3990255772665439e-05, "optim/total_tokens": 1971801030656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2689399719238281, "created_at": "2025-06-03T07:53:15.272169+00:00"} {"global_step": 235058, "acc_step": 0, "speed/wps": 5536.330716869035, "speed/FLOPS": 244677480176144.97, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.17, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04760385677218437, "optim/lr": 1.3986708547570893e-05, "optim/total_tokens": 1971809419264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2680935859680176, "created_at": "2025-06-03T07:53:18.239903+00:00"} {"global_step": 235059, "acc_step": 0, "speed/wps": 5526.059666714435, "speed/FLOPS": 244223552331312.1, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04774137958884239, "optim/lr": 1.3983161322476568e-05, "optim/total_tokens": 1971817807872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2715795040130615, "created_at": "2025-06-03T07:53:21.209083+00:00"} {"global_step": 235060, "acc_step": 0, "speed/wps": 5528.330186481164, "speed/FLOPS": 244323897683427.8, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04584461823105812, "optim/lr": 1.397961409738202e-05, "optim/total_tokens": 1971826196480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2939471006393433, "created_at": "2025-06-03T07:53:24.181209+00:00"} {"global_step": 235061, "acc_step": 0, "speed/wps": 5519.590498970033, "speed/FLOPS": 243937648229211.75, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.05045761168003082, "optim/lr": 1.3976066872287474e-05, "optim/total_tokens": 1971834585088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2639086246490479, "created_at": "2025-06-03T07:53:27.158123+00:00"} {"global_step": 235062, "acc_step": 0, "speed/wps": 5513.952428151039, "speed/FLOPS": 243688474357274.75, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.25 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.25, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04727478697896004, "optim/lr": 1.3972519647192927e-05, "optim/total_tokens": 1971842973696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2663466930389404, "created_at": "2025-06-03T07:53:30.135638+00:00"} {"global_step": 235063, "acc_step": 0, "speed/wps": 5528.059902124981, "speed/FLOPS": 244311952498325.28, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04896262288093567, "optim/lr": 1.3968972422098603e-05, "optim/total_tokens": 1971851362304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2729917764663696, "created_at": "2025-06-03T07:53:33.107950+00:00"} {"global_step": 235064, "acc_step": 0, "speed/wps": 5524.670831743991, "speed/FLOPS": 244162172934320.25, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045594144612550735, "optim/lr": 1.3965425197004056e-05, "optim/total_tokens": 1971859750912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2718243598937988, "created_at": "2025-06-03T07:53:36.081468+00:00"} {"global_step": 235065, "acc_step": 0, "speed/wps": 5518.301299386919, "speed/FLOPS": 243880672206359.75, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.051333025097846985, "optim/lr": 1.3961877971909508e-05, "optim/total_tokens": 1971868139520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2601767778396606, "created_at": "2025-06-03T07:53:39.055441+00:00"} {"global_step": 235066, "acc_step": 0, "speed/wps": 5533.3487046163655, "speed/FLOPS": 244545690497899.34, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04608853906393051, "optim/lr": 1.3958330746814962e-05, "optim/total_tokens": 1971876528128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.266987919807434, "created_at": "2025-06-03T07:53:42.026435+00:00"} {"global_step": 235067, "acc_step": 0, "speed/wps": 5524.540483176383, "speed/FLOPS": 244156412194816.44, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04517339542508125, "optim/lr": 1.3954783521720637e-05, "optim/total_tokens": 1971884916736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2615649700164795, "created_at": "2025-06-03T07:53:44.997104+00:00"} {"global_step": 235068, "acc_step": 0, "speed/wps": 5535.713865812776, "speed/FLOPS": 244650218516788.25, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.2, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05176078900694847, "optim/lr": 1.3951236296626091e-05, "optim/total_tokens": 1971893305344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2617640495300293, "created_at": "2025-06-03T07:53:47.964241+00:00"} {"global_step": 235069, "acc_step": 0, "speed/wps": 5519.619153661991, "speed/FLOPS": 243938914619928.25, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.0456918440759182, "optim/lr": 1.3947689071531545e-05, "optim/total_tokens": 1971901693952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.275779366493225, "created_at": "2025-06-03T07:53:50.940627+00:00"} {"global_step": 235070, "acc_step": 0, "speed/wps": 5510.239113457671, "speed/FLOPS": 243524364854295.44, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.049716681241989136, "optim/lr": 1.3944141846436997e-05, "optim/total_tokens": 1971910082560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2896732091903687, "created_at": "2025-06-03T07:53:53.919568+00:00"} {"global_step": 235071, "acc_step": 0, "speed/wps": 5525.938578882316, "speed/FLOPS": 244218200868916.12, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04781452193856239, "optim/lr": 1.3940594621342672e-05, "optim/total_tokens": 1971918471168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2712981700897217, "created_at": "2025-06-03T07:53:56.889342+00:00"} {"global_step": 235072, "acc_step": 0, "speed/wps": 5527.590228837582, "speed/FLOPS": 244291195343028.06, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.051955509930849075, "optim/lr": 1.3937047396248126e-05, "optim/total_tokens": 1971926859776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2798488140106201, "created_at": "2025-06-03T07:53:59.862575+00:00"} {"global_step": 235073, "acc_step": 0, "speed/wps": 5523.976061552134, "speed/FLOPS": 244131467647996.38, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.62, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04707949981093407, "optim/lr": 1.393350017115358e-05, "optim/total_tokens": 1971935248384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2607755661010742, "created_at": "2025-06-03T07:54:02.833604+00:00"} {"global_step": 235074, "acc_step": 0, "speed/wps": 5528.368583527438, "speed/FLOPS": 244325594636339.25, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047648411244153976, "optim/lr": 1.3929952946059033e-05, "optim/total_tokens": 1971943636992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2575430870056152, "created_at": "2025-06-03T07:54:05.805518+00:00"} {"global_step": 235075, "acc_step": 0, "speed/wps": 5470.337998124498, "speed/FLOPS": 241760939788991.56, "speed/curr_iter_time": 2.9941, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9941, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "3.26 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 3.26, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.045621033757925034, "optim/lr": 1.3926405720964708e-05, "optim/total_tokens": 1971952025600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.250101923942566, "created_at": "2025-06-03T07:54:08.809589+00:00"} {"global_step": 235076, "acc_step": 0, "speed/wps": 5521.421840542316, "speed/FLOPS": 244018584153050.75, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047495439648628235, "optim/lr": 1.392285849587016e-05, "optim/total_tokens": 1971960414208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2677398920059204, "created_at": "2025-06-03T07:54:11.783519+00:00"} {"global_step": 235077, "acc_step": 0, "speed/wps": 5518.013499849619, "speed/FLOPS": 243867952939902.66, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04820369556546211, "optim/lr": 1.3919311270775614e-05, "optim/total_tokens": 1971968802816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.276501178741455, "created_at": "2025-06-03T07:54:14.758489+00:00"} {"global_step": 235078, "acc_step": 0, "speed/wps": 5520.778782442689, "speed/FLOPS": 243990164276516.94, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045380037277936935, "optim/lr": 1.3915764045681068e-05, "optim/total_tokens": 1971977191424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2697399854660034, "created_at": "2025-06-03T07:54:17.732186+00:00"} {"global_step": 235079, "acc_step": 0, "speed/wps": 5501.295778112706, "speed/FLOPS": 243129115208188.0, "speed/curr_iter_time": 2.9773, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9773, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.14, "optim/grad_norm": 0.04709125682711601, "optim/lr": 1.3912216820586743e-05, "optim/total_tokens": 1971985580032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2630321979522705, "created_at": "2025-06-03T07:54:20.717626+00:00"} {"global_step": 235080, "acc_step": 0, "speed/wps": 5511.642692668354, "speed/FLOPS": 243586395871237.97, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.24 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.24, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047696515917778015, "optim/lr": 1.3908669595492197e-05, "optim/total_tokens": 1971993968640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.264672040939331, "created_at": "2025-06-03T07:54:23.697657+00:00"} {"global_step": 235081, "acc_step": 0, "speed/wps": 5536.849727249762, "speed/FLOPS": 244700417778437.12, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.08, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0458533838391304, "optim/lr": 1.3905122370397649e-05, "optim/total_tokens": 1972002357248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2597287893295288, "created_at": "2025-06-03T07:54:26.664124+00:00"} {"global_step": 235082, "acc_step": 0, "speed/wps": 5511.311522920925, "speed/FLOPS": 243571759863482.03, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05047398805618286, "optim/lr": 1.3901575145303102e-05, "optim/total_tokens": 1972010745856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2631471157073975, "created_at": "2025-06-03T07:54:29.641954+00:00"} {"global_step": 235083, "acc_step": 0, "speed/wps": 5516.05791070767, "speed/FLOPS": 243781525909441.16, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04605153948068619, "optim/lr": 1.3898027920208778e-05, "optim/total_tokens": 1972019134464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2634137868881226, "created_at": "2025-06-03T07:54:32.620882+00:00"} {"global_step": 235084, "acc_step": 0, "speed/wps": 5522.703116190617, "speed/FLOPS": 244075209978542.38, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05202421918511391, "optim/lr": 1.3894480695114231e-05, "optim/total_tokens": 1972027523072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2555055618286133, "created_at": "2025-06-03T07:54:35.597116+00:00"} {"global_step": 235085, "acc_step": 0, "speed/wps": 5533.45546588634, "speed/FLOPS": 244550408799578.47, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.29, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04759833589196205, "optim/lr": 1.3890933470019685e-05, "optim/total_tokens": 1972035911680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.267653226852417, "created_at": "2025-06-03T07:54:38.563400+00:00"} {"global_step": 235086, "acc_step": 0, "speed/wps": 5522.005885077842, "speed/FLOPS": 244044395932110.06, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05166962742805481, "optim/lr": 1.3887386244925359e-05, "optim/total_tokens": 1972044300288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.26255464553833, "created_at": "2025-06-03T07:54:41.541982+00:00"} {"global_step": 235087, "acc_step": 0, "speed/wps": 5531.687531213022, "speed/FLOPS": 244472275136127.8, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.36, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04903734102845192, "optim/lr": 1.3883839019830812e-05, "optim/total_tokens": 1972052688896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2683008909225464, "created_at": "2025-06-03T07:54:44.515182+00:00"} {"global_step": 235088, "acc_step": 0, "speed/wps": 5510.5351810232305, "speed/FLOPS": 243537449525282.0, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04734012112021446, "optim/lr": 1.3880291794736266e-05, "optim/total_tokens": 1972061077504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2663938999176025, "created_at": "2025-06-03T07:54:47.493671+00:00"} {"global_step": 235089, "acc_step": 0, "speed/wps": 5529.997593824537, "speed/FLOPS": 244397588553440.47, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04769306629896164, "optim/lr": 1.387674456964172e-05, "optim/total_tokens": 1972069466112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2937862873077393, "created_at": "2025-06-03T07:54:50.464489+00:00"} {"global_step": 235090, "acc_step": 0, "speed/wps": 5527.0588956186375, "speed/FLOPS": 244267713134360.7, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046838514506816864, "optim/lr": 1.3873197344547395e-05, "optim/total_tokens": 1972077854720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2640886306762695, "created_at": "2025-06-03T07:54:53.435479+00:00"} {"global_step": 235091, "acc_step": 0, "speed/wps": 5522.733017273023, "speed/FLOPS": 244076531453337.06, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04916246980428696, "optim/lr": 1.3869650119452849e-05, "optim/total_tokens": 1972086243328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.259941577911377, "created_at": "2025-06-03T07:54:56.406530+00:00"} {"global_step": 235092, "acc_step": 0, "speed/wps": 5526.606930908526, "speed/FLOPS": 244247738607538.84, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04992695525288582, "optim/lr": 1.38661028943583e-05, "optim/total_tokens": 1972094631936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.26589035987854, "created_at": "2025-06-03T07:54:59.379019+00:00"} {"global_step": 235093, "acc_step": 0, "speed/wps": 5520.490936214327, "speed/FLOPS": 243977442946553.9, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.75, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04874333366751671, "optim/lr": 1.3862555669263754e-05, "optim/total_tokens": 1972103020544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2740166187286377, "created_at": "2025-06-03T07:55:02.351001+00:00"} {"global_step": 235094, "acc_step": 0, "speed/wps": 5521.611144522416, "speed/FLOPS": 244026950420025.56, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.62, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.049844980239868164, "optim/lr": 1.385900844416943e-05, "optim/total_tokens": 1972111409152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.255645751953125, "created_at": "2025-06-03T07:55:05.326805+00:00"} {"global_step": 235095, "acc_step": 0, "speed/wps": 5523.234140688705, "speed/FLOPS": 244098678543328.1, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046634968370199203, "optim/lr": 1.3855461219074883e-05, "optim/total_tokens": 1972119797760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2724812030792236, "created_at": "2025-06-03T07:55:08.302074+00:00"} {"global_step": 235096, "acc_step": 0, "speed/wps": 5502.102029638146, "speed/FLOPS": 243164747398843.0, "speed/curr_iter_time": 2.9769, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9769, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.23 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.23, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05188222602009773, "optim/lr": 1.3851913993980337e-05, "optim/total_tokens": 1972128186368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.268332839012146, "created_at": "2025-06-03T07:55:11.284531+00:00"} {"global_step": 235097, "acc_step": 0, "speed/wps": 5538.754817809185, "speed/FLOPS": 244784613030026.2, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.12, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05007155239582062, "optim/lr": 1.3848366768885789e-05, "optim/total_tokens": 1972136574976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2547409534454346, "created_at": "2025-06-03T07:55:14.247650+00:00"} {"global_step": 235098, "acc_step": 0, "speed/wps": 5531.7832894386565, "speed/FLOPS": 244476507159565.8, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.050589654594659805, "optim/lr": 1.3844819543791464e-05, "optim/total_tokens": 1972144963584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2663674354553223, "created_at": "2025-06-03T07:55:17.213766+00:00"} {"global_step": 235099, "acc_step": 0, "speed/wps": 5526.074327713287, "speed/FLOPS": 244224200272419.56, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05554257333278656, "optim/lr": 1.3841272318696918e-05, "optim/total_tokens": 1972153352192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2752327919006348, "created_at": "2025-06-03T07:55:20.184800+00:00"} {"global_step": 235100, "acc_step": 0, "speed/wps": 5513.856943203804, "speed/FLOPS": 243684254411343.2, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.22 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.22, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05090993270277977, "optim/lr": 1.3837725093602372e-05, "optim/total_tokens": 1972161740800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2823153734207153, "created_at": "2025-06-03T07:55:23.160539+00:00"} {"global_step": 235101, "acc_step": 0, "speed/wps": 5521.237800843754, "speed/FLOPS": 244010450540374.84, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0514342375099659, "optim/lr": 1.3834177868507825e-05, "optim/total_tokens": 1972170129408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2603291273117065, "created_at": "2025-06-03T07:55:26.132204+00:00"} {"global_step": 235102, "acc_step": 0, "speed/wps": 5527.945362505375, "speed/FLOPS": 244306890433405.62, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04648037254810333, "optim/lr": 1.3830630643413499e-05, "optim/total_tokens": 1972178518016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2595614194869995, "created_at": "2025-06-03T07:55:29.103754+00:00"} {"global_step": 235103, "acc_step": 0, "speed/wps": 5523.9266068533825, "speed/FLOPS": 244129282003443.7, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04649818688631058, "optim/lr": 1.3827083418318953e-05, "optim/total_tokens": 1972186906624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2826850414276123, "created_at": "2025-06-03T07:55:32.074388+00:00"} {"global_step": 235104, "acc_step": 0, "speed/wps": 5513.224966031562, "speed/FLOPS": 243656324255082.5, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04661282151937485, "optim/lr": 1.3823536193224406e-05, "optim/total_tokens": 1972195295232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2598729133605957, "created_at": "2025-06-03T07:55:35.050699+00:00"} {"global_step": 235105, "acc_step": 0, "speed/wps": 5516.14830507191, "speed/FLOPS": 243785520877660.25, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04597225412726402, "optim/lr": 1.381998896812986e-05, "optim/total_tokens": 1972203683840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2735543251037598, "created_at": "2025-06-03T07:55:38.024653+00:00"} {"global_step": 235106, "acc_step": 0, "speed/wps": 5527.008023031626, "speed/FLOPS": 244265464826404.28, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04878120869398117, "optim/lr": 1.3816441743035535e-05, "optim/total_tokens": 1972212072448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2765142917633057, "created_at": "2025-06-03T07:55:40.997094+00:00"} {"global_step": 235107, "acc_step": 0, "speed/wps": 5523.885447315275, "speed/FLOPS": 244127462962532.94, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046651680022478104, "optim/lr": 1.3812894517940987e-05, "optim/total_tokens": 1972220461056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.261637568473816, "created_at": "2025-06-03T07:55:43.968177+00:00"} {"global_step": 235108, "acc_step": 0, "speed/wps": 5523.159389762704, "speed/FLOPS": 244095374935008.78, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048253133893013, "optim/lr": 1.3809347292846441e-05, "optim/total_tokens": 1972228849664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2791591882705688, "created_at": "2025-06-03T07:55:46.943049+00:00"} {"global_step": 235109, "acc_step": 0, "speed/wps": 5510.746375736799, "speed/FLOPS": 243546783250629.16, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04754205420613289, "optim/lr": 1.3805800067751895e-05, "optim/total_tokens": 1972237238272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2813290357589722, "created_at": "2025-06-03T07:55:49.924620+00:00"} {"global_step": 235110, "acc_step": 0, "speed/wps": 5514.717404395823, "speed/FLOPS": 243722282391790.8, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04963609203696251, "optim/lr": 1.380225284265757e-05, "optim/total_tokens": 1972245626880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.276354193687439, "created_at": "2025-06-03T07:55:52.904349+00:00"} {"global_step": 235111, "acc_step": 0, "speed/wps": 5515.980696489763, "speed/FLOPS": 243778113436227.88, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04803567752242088, "optim/lr": 1.3798705617563024e-05, "optim/total_tokens": 1972254015488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2802112102508545, "created_at": "2025-06-03T07:55:55.883858+00:00"} {"global_step": 235112, "acc_step": 0, "speed/wps": 5521.23963936488, "speed/FLOPS": 244010531793598.22, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04591040685772896, "optim/lr": 1.3795158392468477e-05, "optim/total_tokens": 1972262404096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2599151134490967, "created_at": "2025-06-03T07:55:58.860105+00:00"} {"global_step": 235113, "acc_step": 0, "speed/wps": 5518.739478785403, "speed/FLOPS": 243900037492967.25, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04640692472457886, "optim/lr": 1.3791611167374151e-05, "optim/total_tokens": 1972270792704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2644249200820923, "created_at": "2025-06-03T07:56:01.833339+00:00"} {"global_step": 235114, "acc_step": 0, "speed/wps": 5520.026799470541, "speed/FLOPS": 243956930478145.78, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046930089592933655, "optim/lr": 1.3788063942279605e-05, "optim/total_tokens": 1972279181312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2583963871002197, "created_at": "2025-06-03T07:56:04.806781+00:00"} {"global_step": 235115, "acc_step": 0, "speed/wps": 5518.052608744781, "speed/FLOPS": 243869681352891.34, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0459492951631546, "optim/lr": 1.3784516717185058e-05, "optim/total_tokens": 1972287569920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2736557722091675, "created_at": "2025-06-03T07:56:07.782982+00:00"} {"global_step": 235116, "acc_step": 0, "speed/wps": 5523.357610668176, "speed/FLOPS": 244104135284444.03, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04643702134490013, "optim/lr": 1.3780969492090512e-05, "optim/total_tokens": 1972295958528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2654374837875366, "created_at": "2025-06-03T07:56:10.754053+00:00"} {"global_step": 235117, "acc_step": 0, "speed/wps": 5519.073752048077, "speed/FLOPS": 243914810660211.8, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05408907309174538, "optim/lr": 1.3777422266996187e-05, "optim/total_tokens": 1972304347136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2823394536972046, "created_at": "2025-06-03T07:56:13.731142+00:00"} {"global_step": 235118, "acc_step": 0, "speed/wps": 5525.308299654856, "speed/FLOPS": 244190345753123.94, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.19 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.19, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047230515629053116, "optim/lr": 1.377387504190164e-05, "optim/total_tokens": 1972312735744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.252927541732788, "created_at": "2025-06-03T07:56:16.700861+00:00"} {"global_step": 235119, "acc_step": 0, "speed/wps": 5523.397905658156, "speed/FLOPS": 244105916116752.7, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05310302600264549, "optim/lr": 1.3770327816807093e-05, "optim/total_tokens": 1972321124352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2745118141174316, "created_at": "2025-06-03T07:56:19.671763+00:00"} {"global_step": 235120, "acc_step": 0, "speed/wps": 5520.2431771362735, "speed/FLOPS": 243966493263449.88, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04699943959712982, "optim/lr": 1.3766780591712547e-05, "optim/total_tokens": 1972329512960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2512140274047852, "created_at": "2025-06-03T07:56:22.644471+00:00"} {"global_step": 235121, "acc_step": 0, "speed/wps": 5510.636162730697, "speed/FLOPS": 243541912399880.78, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048164818435907364, "optim/lr": 1.3763233366618222e-05, "optim/total_tokens": 1972337901568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2739320993423462, "created_at": "2025-06-03T07:56:25.622451+00:00"} {"global_step": 235122, "acc_step": 0, "speed/wps": 5496.628267834569, "speed/FLOPS": 242922835144377.66, "speed/curr_iter_time": 2.9799, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9799, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "3.21 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 3.21, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0491272434592247, "optim/lr": 1.3759686141523676e-05, "optim/total_tokens": 1972346290176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2675814628601074, "created_at": "2025-06-03T07:56:28.610382+00:00"} {"global_step": 235123, "acc_step": 0, "speed/wps": 5535.612944465338, "speed/FLOPS": 244645758309793.75, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.19 hours", "speed/est_time_elapsed_hrs": 193.24, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.19, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04862505570054054, "optim/lr": 1.3756138916429128e-05, "optim/total_tokens": 1972354678784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.279598593711853, "created_at": "2025-06-03T07:56:31.574927+00:00"} {"global_step": 235124, "acc_step": 0, "speed/wps": 5529.82474358999, "speed/FLOPS": 244389949457801.2, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.19 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.19, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04629843309521675, "optim/lr": 1.3752591691334581e-05, "optim/total_tokens": 1972363067392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2494490146636963, "created_at": "2025-06-03T07:56:34.541871+00:00"} {"global_step": 235125, "acc_step": 0, "speed/wps": 5507.924621883725, "speed/FLOPS": 243422076173368.84, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04600929468870163, "optim/lr": 1.3749044466240257e-05, "optim/total_tokens": 1972371456000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2707101106643677, "created_at": "2025-06-03T07:56:37.521572+00:00"} {"global_step": 235126, "acc_step": 0, "speed/wps": 5513.628191050547, "speed/FLOPS": 243674144737028.88, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04760730639100075, "optim/lr": 1.374549724114571e-05, "optim/total_tokens": 1972379844608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2649009227752686, "created_at": "2025-06-03T07:56:40.502177+00:00"} {"global_step": 235127, "acc_step": 0, "speed/wps": 5508.390707229261, "speed/FLOPS": 243442674760000.47, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046358224004507065, "optim/lr": 1.3741950016051164e-05, "optim/total_tokens": 1972388233216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2612653970718384, "created_at": "2025-06-03T07:56:43.483929+00:00"} {"global_step": 235128, "acc_step": 0, "speed/wps": 5518.107766197295, "speed/FLOPS": 243872119029971.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.19 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.19, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048414360731840134, "optim/lr": 1.3738402790956616e-05, "optim/total_tokens": 1972396621824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2647545337677002, "created_at": "2025-06-03T07:56:46.462524+00:00"} {"global_step": 235129, "acc_step": 0, "speed/wps": 5502.249064555322, "speed/FLOPS": 243171245589589.25, "speed/curr_iter_time": 2.9768, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9768, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04654395952820778, "optim/lr": 1.3734855565862291e-05, "optim/total_tokens": 1972405010432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2773061990737915, "created_at": "2025-06-03T07:56:49.449745+00:00"} {"global_step": 235130, "acc_step": 0, "speed/wps": 5509.154070635107, "speed/FLOPS": 243476411515290.72, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.2 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.2, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0457884818315506, "optim/lr": 1.3731308340767745e-05, "optim/total_tokens": 1972413399040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.257492184638977, "created_at": "2025-06-03T07:56:52.428721+00:00"} {"global_step": 235131, "acc_step": 0, "speed/wps": 5532.744113072405, "speed/FLOPS": 244518970646236.3, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.28, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0456995964050293, "optim/lr": 1.3727761115673199e-05, "optim/total_tokens": 1972421787648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2676098346710205, "created_at": "2025-06-03T07:56:55.394568+00:00"} {"global_step": 235132, "acc_step": 0, "speed/wps": 5529.949906864928, "speed/FLOPS": 244395481033909.75, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04635784775018692, "optim/lr": 1.3724213890578652e-05, "optim/total_tokens": 1972430176256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2721199989318848, "created_at": "2025-06-03T07:56:58.361987+00:00"} {"global_step": 235133, "acc_step": 0, "speed/wps": 5524.7010560262925, "speed/FLOPS": 244163508692896.1, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04588516056537628, "optim/lr": 1.3720666665484328e-05, "optim/total_tokens": 1972438564864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2624679803848267, "created_at": "2025-06-03T07:57:01.332141+00:00"} {"global_step": 235134, "acc_step": 0, "speed/wps": 5527.668265602037, "speed/FLOPS": 244294644168588.6, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04799604043364525, "optim/lr": 1.371711944038978e-05, "optim/total_tokens": 1972446953472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2660762071609497, "created_at": "2025-06-03T07:57:04.300289+00:00"} {"global_step": 235135, "acc_step": 0, "speed/wps": 5519.143638141333, "speed/FLOPS": 243917899267824.28, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.76, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04603919759392738, "optim/lr": 1.3713572215295233e-05, "optim/total_tokens": 1972455342080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2747894525527954, "created_at": "2025-06-03T07:57:07.278544+00:00"} {"global_step": 235136, "acc_step": 0, "speed/wps": 5512.037889923644, "speed/FLOPS": 243603861567118.84, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.19 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.19, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047834813594818115, "optim/lr": 1.3710024990200687e-05, "optim/total_tokens": 1972463730688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2713103294372559, "created_at": "2025-06-03T07:57:10.255320+00:00"} {"global_step": 235137, "acc_step": 0, "speed/wps": 5509.894887373226, "speed/FLOPS": 243509151823271.78, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.19 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.19, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045387689024209976, "optim/lr": 1.3706477765106362e-05, "optim/total_tokens": 1972472119296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2679791450500488, "created_at": "2025-06-03T07:57:13.233113+00:00"} {"global_step": 235138, "acc_step": 0, "speed/wps": 5520.130035986661, "speed/FLOPS": 243961493003745.9, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04653150588274002, "optim/lr": 1.3702930540011816e-05, "optim/total_tokens": 1972480507904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2707680463790894, "created_at": "2025-06-03T07:57:16.206148+00:00"} {"global_step": 235139, "acc_step": 0, "speed/wps": 5520.433954620141, "speed/FLOPS": 243974924651749.12, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.049268390983343124, "optim/lr": 1.3699383314917268e-05, "optim/total_tokens": 1972488896512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2736626863479614, "created_at": "2025-06-03T07:57:19.178763+00:00"} {"global_step": 235140, "acc_step": 0, "speed/wps": 5521.552875998324, "speed/FLOPS": 244024375249506.06, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045853983610868454, "optim/lr": 1.3695836089822943e-05, "optim/total_tokens": 1972497285120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2700748443603516, "created_at": "2025-06-03T07:57:22.150541+00:00"} {"global_step": 235141, "acc_step": 0, "speed/wps": 5527.4685476913255, "speed/FLOPS": 244285817659184.1, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.06321649998426437, "optim/lr": 1.3692288864728397e-05, "optim/total_tokens": 1972505673728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.271081566810608, "created_at": "2025-06-03T07:57:25.121483+00:00"} {"global_step": 235142, "acc_step": 0, "speed/wps": 5521.776519552565, "speed/FLOPS": 244034259149892.0, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.66, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04566680267453194, "optim/lr": 1.368874163963385e-05, "optim/total_tokens": 1972514062336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2614107131958008, "created_at": "2025-06-03T07:57:28.093569+00:00"} {"global_step": 235143, "acc_step": 0, "speed/wps": 5519.298942434296, "speed/FLOPS": 243924762922653.78, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05138106644153595, "optim/lr": 1.3685194414539304e-05, "optim/total_tokens": 1972522450944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.256980061531067, "created_at": "2025-06-03T07:57:31.070033+00:00"} {"global_step": 235144, "acc_step": 0, "speed/wps": 5511.206371064379, "speed/FLOPS": 243567112689638.7, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04671754688024521, "optim/lr": 1.3681647189444978e-05, "optim/total_tokens": 1972530839552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2726266384124756, "created_at": "2025-06-03T07:57:34.049929+00:00"} {"global_step": 235145, "acc_step": 0, "speed/wps": 5512.933536511366, "speed/FLOPS": 243643444561961.34, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047428663820028305, "optim/lr": 1.3678099964350432e-05, "optim/total_tokens": 1972539228160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2762982845306396, "created_at": "2025-06-03T07:57:37.025983+00:00"} {"global_step": 235146, "acc_step": 0, "speed/wps": 5510.8438327401755, "speed/FLOPS": 243551090351348.25, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.18 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.18, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04731940105557442, "optim/lr": 1.3674552739255885e-05, "optim/total_tokens": 1972547616768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2750564813613892, "created_at": "2025-06-03T07:57:40.008253+00:00"} {"global_step": 235147, "acc_step": 0, "speed/wps": 5526.201125338692, "speed/FLOPS": 244229804078453.38, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0457659475505352, "optim/lr": 1.3671005514161339e-05, "optim/total_tokens": 1972556005376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.246806025505066, "created_at": "2025-06-03T07:57:42.977193+00:00"} {"global_step": 235148, "acc_step": 0, "speed/wps": 5528.781737644369, "speed/FLOPS": 244343853933593.12, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047237545251846313, "optim/lr": 1.3667458289067014e-05, "optim/total_tokens": 1972564393984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2580182552337646, "created_at": "2025-06-03T07:57:45.944486+00:00"} {"global_step": 235149, "acc_step": 0, "speed/wps": 5531.1961327926865, "speed/FLOPS": 244450557841154.1, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04681166633963585, "optim/lr": 1.3663911063972468e-05, "optim/total_tokens": 1972572782592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2649834156036377, "created_at": "2025-06-03T07:57:48.914559+00:00"} {"global_step": 235150, "acc_step": 0, "speed/wps": 5520.260677117913, "speed/FLOPS": 243967266673065.28, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04779521003365517, "optim/lr": 1.366036383887792e-05, "optim/total_tokens": 1972581171200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2643474340438843, "created_at": "2025-06-03T07:57:51.891179+00:00"} {"global_step": 235151, "acc_step": 0, "speed/wps": 5521.960146683582, "speed/FLOPS": 244042374529194.1, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047999151051044464, "optim/lr": 1.3656816613783374e-05, "optim/total_tokens": 1972589559808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2712708711624146, "created_at": "2025-06-03T07:57:54.866837+00:00"} {"global_step": 235152, "acc_step": 0, "speed/wps": 5525.2115342620045, "speed/FLOPS": 244186069218050.1, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04528909921646118, "optim/lr": 1.3653269388689049e-05, "optim/total_tokens": 1972597948416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2525192499160767, "created_at": "2025-06-03T07:57:57.836732+00:00"} {"global_step": 235153, "acc_step": 0, "speed/wps": 5518.30729938849, "speed/FLOPS": 243880937375718.4, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04559968039393425, "optim/lr": 1.3649722163594503e-05, "optim/total_tokens": 1972606337024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.261405110359192, "created_at": "2025-06-03T07:58:00.810384+00:00"} {"global_step": 235154, "acc_step": 0, "speed/wps": 5515.54594145966, "speed/FLOPS": 243758899489175.25, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0479741171002388, "optim/lr": 1.3646174938499956e-05, "optim/total_tokens": 1972614725632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2840286493301392, "created_at": "2025-06-03T07:58:03.788798+00:00"} {"global_step": 235155, "acc_step": 0, "speed/wps": 5518.201952681952, "speed/FLOPS": 243876281590502.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04758000746369362, "optim/lr": 1.3642627713405408e-05, "optim/total_tokens": 1972623114240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.263779640197754, "created_at": "2025-06-03T07:58:06.762466+00:00"} {"global_step": 235156, "acc_step": 0, "speed/wps": 5525.765046772937, "speed/FLOPS": 244210531637899.47, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04931887611746788, "optim/lr": 1.3639080488311084e-05, "optim/total_tokens": 1972631502848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2658674716949463, "created_at": "2025-06-03T07:58:09.734384+00:00"} {"global_step": 235157, "acc_step": 0, "speed/wps": 5526.0538945967255, "speed/FLOPS": 244223297233253.72, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04601537063717842, "optim/lr": 1.3635533263216537e-05, "optim/total_tokens": 1972639891456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.271583914756775, "created_at": "2025-06-03T07:58:12.708724+00:00"} {"global_step": 235158, "acc_step": 0, "speed/wps": 5511.643290141579, "speed/FLOPS": 243586422276496.38, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05010043829679489, "optim/lr": 1.3631986038121991e-05, "optim/total_tokens": 1972648280064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2596352100372314, "created_at": "2025-06-03T07:58:15.691822+00:00"} {"global_step": 235159, "acc_step": 0, "speed/wps": 5525.137747103404, "speed/FLOPS": 244182808203316.88, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04621170833706856, "optim/lr": 1.3628438813027445e-05, "optim/total_tokens": 1972656668672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2604000568389893, "created_at": "2025-06-03T07:58:18.665112+00:00"} {"global_step": 235160, "acc_step": 0, "speed/wps": 5520.73013644765, "speed/FLOPS": 243988014372529.0, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04716050997376442, "optim/lr": 1.3624891587933118e-05, "optim/total_tokens": 1972665057280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2664066553115845, "created_at": "2025-06-03T07:58:21.638330+00:00"} {"global_step": 235161, "acc_step": 0, "speed/wps": 5521.481550299005, "speed/FLOPS": 244021223018674.16, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046153560280799866, "optim/lr": 1.3621344362838572e-05, "optim/total_tokens": 1972673445888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2740050554275513, "created_at": "2025-06-03T07:58:24.610432+00:00"} {"global_step": 235162, "acc_step": 0, "speed/wps": 5512.617393377495, "speed/FLOPS": 243629472653611.53, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04711631312966347, "optim/lr": 1.3617797137744026e-05, "optim/total_tokens": 1972681834496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.273748755455017, "created_at": "2025-06-03T07:58:27.587246+00:00"} {"global_step": 235163, "acc_step": 0, "speed/wps": 5515.36688670078, "speed/FLOPS": 243750986185318.1, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04565059766173363, "optim/lr": 1.361424991264948e-05, "optim/total_tokens": 1972690223104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2847440242767334, "created_at": "2025-06-03T07:58:30.562761+00:00"} {"global_step": 235164, "acc_step": 0, "speed/wps": 5511.709569030507, "speed/FLOPS": 243589351464140.88, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.17 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.17, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047016970813274384, "optim/lr": 1.3610702687555155e-05, "optim/total_tokens": 1972698611712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2489744424819946, "created_at": "2025-06-03T07:58:33.540176+00:00"} {"global_step": 235165, "acc_step": 0, "speed/wps": 5532.058885925545, "speed/FLOPS": 244488687113655.6, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04620389640331268, "optim/lr": 1.3607155462460607e-05, "optim/total_tokens": 1972707000320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.262679934501648, "created_at": "2025-06-03T07:58:36.506643+00:00"} {"global_step": 235166, "acc_step": 0, "speed/wps": 5529.622473435543, "speed/FLOPS": 244381010152287.12, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 193.5, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04860888049006462, "optim/lr": 1.360360823736606e-05, "optim/total_tokens": 1972715388928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2780035734176636, "created_at": "2025-06-03T07:58:39.478169+00:00"} {"global_step": 235167, "acc_step": 0, "speed/wps": 5517.506824033128, "speed/FLOPS": 243845560462215.72, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045934293419122696, "optim/lr": 1.3600061012271736e-05, "optim/total_tokens": 1972723777536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2631158828735352, "created_at": "2025-06-03T07:58:42.452008+00:00"} {"global_step": 235168, "acc_step": 0, "speed/wps": 5526.7065978465425, "speed/FLOPS": 244252143376057.53, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04650888964533806, "optim/lr": 1.359651378717719e-05, "optim/total_tokens": 1972732166144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.266092300415039, "created_at": "2025-06-03T07:58:45.425168+00:00"} {"global_step": 235169, "acc_step": 0, "speed/wps": 5523.06010951492, "speed/FLOPS": 244090987256219.1, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04550617188215256, "optim/lr": 1.3592966562082643e-05, "optim/total_tokens": 1972740554752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2837636470794678, "created_at": "2025-06-03T07:58:48.398309+00:00"} {"global_step": 235170, "acc_step": 0, "speed/wps": 5519.277267194032, "speed/FLOPS": 243923804987978.06, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046289488673210144, "optim/lr": 1.3589419336988097e-05, "optim/total_tokens": 1972748943360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.277677297592163, "created_at": "2025-06-03T07:58:51.374827+00:00"} {"global_step": 235171, "acc_step": 0, "speed/wps": 5512.143709954857, "speed/FLOPS": 243608538270862.44, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047629453241825104, "optim/lr": 1.358587211189377e-05, "optim/total_tokens": 1972757331968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2754756212234497, "created_at": "2025-06-03T07:58:54.351973+00:00"} {"global_step": 235172, "acc_step": 0, "speed/wps": 5523.076924235111, "speed/FLOPS": 244091730380785.97, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04639240354299545, "optim/lr": 1.3582324886799224e-05, "optim/total_tokens": 1972765720576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2608146667480469, "created_at": "2025-06-03T07:58:57.322745+00:00"} {"global_step": 235173, "acc_step": 0, "speed/wps": 5523.052457981977, "speed/FLOPS": 244090649097627.06, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05067617446184158, "optim/lr": 1.3578777661704678e-05, "optim/total_tokens": 1972774109184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2889864444732666, "created_at": "2025-06-03T07:59:00.298229+00:00"} {"global_step": 235174, "acc_step": 0, "speed/wps": 5523.908576714734, "speed/FLOPS": 244128485163602.06, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04688640683889389, "optim/lr": 1.3575230436610131e-05, "optim/total_tokens": 1972782497792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2700992822647095, "created_at": "2025-06-03T07:59:03.269077+00:00"} {"global_step": 235175, "acc_step": 0, "speed/wps": 5512.499076410907, "speed/FLOPS": 243624243649289.44, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0471009686589241, "optim/lr": 1.3571683211515807e-05, "optim/total_tokens": 1972790886400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.251967191696167, "created_at": "2025-06-03T07:59:06.246500+00:00"} {"global_step": 235176, "acc_step": 0, "speed/wps": 5512.470213612839, "speed/FLOPS": 243622968061348.03, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04625263810157776, "optim/lr": 1.3568135986421259e-05, "optim/total_tokens": 1972799275008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2564890384674072, "created_at": "2025-06-03T07:59:09.223126+00:00"} {"global_step": 235177, "acc_step": 0, "speed/wps": 5516.067403894374, "speed/FLOPS": 243781945459702.94, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04973636940121651, "optim/lr": 1.3564588761326712e-05, "optim/total_tokens": 1972807663616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2686067819595337, "created_at": "2025-06-03T07:59:12.197740+00:00"} {"global_step": 235178, "acc_step": 0, "speed/wps": 5508.875285201871, "speed/FLOPS": 243464090626094.88, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.16 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.16, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045895904302597046, "optim/lr": 1.3561041536232166e-05, "optim/total_tokens": 1972816052224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2667492628097534, "created_at": "2025-06-03T07:59:15.176600+00:00"} {"global_step": 235179, "acc_step": 0, "speed/wps": 5508.431565465389, "speed/FLOPS": 243444480484905.9, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04615350440144539, "optim/lr": 1.3557494311137841e-05, "optim/total_tokens": 1972824440832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2682397365570068, "created_at": "2025-06-03T07:59:18.156581+00:00"} {"global_step": 235180, "acc_step": 0, "speed/wps": 5514.322871589534, "speed/FLOPS": 243704846061154.78, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048000212758779526, "optim/lr": 1.3553947086043295e-05, "optim/total_tokens": 1972832829440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2674546241760254, "created_at": "2025-06-03T07:59:21.135392+00:00"} {"global_step": 235181, "acc_step": 0, "speed/wps": 5510.496661917022, "speed/FLOPS": 243535747177946.22, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.15 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.15, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046079035848379135, "optim/lr": 1.3550399860948747e-05, "optim/total_tokens": 1972841218048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2574008703231812, "created_at": "2025-06-03T07:59:24.113405+00:00"} {"global_step": 235182, "acc_step": 0, "speed/wps": 5523.72407115845, "speed/FLOPS": 244120330962399.34, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05029916763305664, "optim/lr": 1.35468526358542e-05, "optim/total_tokens": 1972849606656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.251813292503357, "created_at": "2025-06-03T07:59:27.084279+00:00"} {"global_step": 235183, "acc_step": 0, "speed/wps": 5523.273950931152, "speed/FLOPS": 244100437952276.94, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04681379348039627, "optim/lr": 1.3543305410759876e-05, "optim/total_tokens": 1972857995264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2819699048995972, "created_at": "2025-06-03T07:59:30.056840+00:00"} {"global_step": 235184, "acc_step": 0, "speed/wps": 5524.876197856433, "speed/FLOPS": 244171249065331.12, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04628059267997742, "optim/lr": 1.353975818566533e-05, "optim/total_tokens": 1972866383872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.277125597000122, "created_at": "2025-06-03T07:59:33.028741+00:00"} {"global_step": 235185, "acc_step": 0, "speed/wps": 5525.798579955881, "speed/FLOPS": 244212013632947.2, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04569735378026962, "optim/lr": 1.3536210960570783e-05, "optim/total_tokens": 1972874772480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2734434604644775, "created_at": "2025-06-03T07:59:35.998453+00:00"} {"global_step": 235186, "acc_step": 0, "speed/wps": 5527.123509716768, "speed/FLOPS": 244270568746773.12, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046648018062114716, "optim/lr": 1.3532663735476235e-05, "optim/total_tokens": 1972883161088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2522748708724976, "created_at": "2025-06-03T07:59:38.970806+00:00"} {"global_step": 235187, "acc_step": 0, "speed/wps": 5523.674764055336, "speed/FLOPS": 244118151840818.3, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04785402491688728, "optim/lr": 1.352911651038191e-05, "optim/total_tokens": 1972891549696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.255858302116394, "created_at": "2025-06-03T07:59:41.944456+00:00"} {"global_step": 235188, "acc_step": 0, "speed/wps": 5528.2600619006425, "speed/FLOPS": 244320798535898.94, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048318177461624146, "optim/lr": 1.3525569285287364e-05, "optim/total_tokens": 1972899938304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2577435970306396, "created_at": "2025-06-03T07:59:44.912710+00:00"} {"global_step": 235189, "acc_step": 0, "speed/wps": 5527.116877974084, "speed/FLOPS": 244270275657690.8, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04619082063436508, "optim/lr": 1.3522022060192818e-05, "optim/total_tokens": 1972908326912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2751859426498413, "created_at": "2025-06-03T07:59:47.881423+00:00"} {"global_step": 235190, "acc_step": 0, "speed/wps": 5518.330915244461, "speed/FLOPS": 243881981075675.4, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047987114638090134, "optim/lr": 1.3518474835098272e-05, "optim/total_tokens": 1972916715520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.271878957748413, "created_at": "2025-06-03T07:59:50.858145+00:00"} {"global_step": 235191, "acc_step": 0, "speed/wps": 5526.2079775182765, "speed/FLOPS": 244230106909718.38, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04588121175765991, "optim/lr": 1.3514927610003947e-05, "optim/total_tokens": 1972925104128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2653298377990723, "created_at": "2025-06-03T07:59:53.827202+00:00"} {"global_step": 235192, "acc_step": 0, "speed/wps": 5525.321521938979, "speed/FLOPS": 244190930110404.38, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0465829074382782, "optim/lr": 1.3511380384909399e-05, "optim/total_tokens": 1972933492736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2637444734573364, "created_at": "2025-06-03T07:59:56.796929+00:00"} {"global_step": 235193, "acc_step": 0, "speed/wps": 5522.887585190246, "speed/FLOPS": 244083362564128.03, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 193.75, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047448355704545975, "optim/lr": 1.3507833159814853e-05, "optim/total_tokens": 1972941881344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.274621844291687, "created_at": "2025-06-03T07:59:59.769598+00:00"} {"global_step": 235194, "acc_step": 0, "speed/wps": 5524.698423609235, "speed/FLOPS": 244163392353536.1, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04882378131151199, "optim/lr": 1.3504285934720306e-05, "optim/total_tokens": 1972950269952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2651702165603638, "created_at": "2025-06-03T08:00:02.744417+00:00"} {"global_step": 235195, "acc_step": 0, "speed/wps": 5506.827015432166, "speed/FLOPS": 243373567586269.03, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04586520045995712, "optim/lr": 1.3500738709625982e-05, "optim/total_tokens": 1972958658560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2588140964508057, "created_at": "2025-06-03T08:00:05.729196+00:00"} {"global_step": 235196, "acc_step": 0, "speed/wps": 5512.3710521372495, "speed/FLOPS": 243618585631681.44, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0473441481590271, "optim/lr": 1.3497191484531435e-05, "optim/total_tokens": 1972967047168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2614531517028809, "created_at": "2025-06-03T08:00:08.712843+00:00"} {"global_step": 235197, "acc_step": 0, "speed/wps": 5509.900828122665, "speed/FLOPS": 243509414373989.5, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04953030124306679, "optim/lr": 1.3493644259436887e-05, "optim/total_tokens": 1972975435776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.267284631729126, "created_at": "2025-06-03T08:00:11.696719+00:00"} {"global_step": 235198, "acc_step": 0, "speed/wps": 5505.096681077736, "speed/FLOPS": 243297095664457.34, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.14 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.14, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04603201523423195, "optim/lr": 1.3490097034342563e-05, "optim/total_tokens": 1972983824384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.266595721244812, "created_at": "2025-06-03T08:00:14.680443+00:00"} {"global_step": 235199, "acc_step": 0, "speed/wps": 5524.640894927478, "speed/FLOPS": 244160849880260.94, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046911194920539856, "optim/lr": 1.3486549809248016e-05, "optim/total_tokens": 1972992212992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.263303279876709, "created_at": "2025-06-03T08:00:17.653959+00:00"} {"global_step": 235200, "acc_step": 0, "speed/wps": 5523.5984503034315, "speed/FLOPS": 244114779163593.34, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04624542221426964, "optim/lr": 1.348300258415347e-05, "optim/total_tokens": 1973000601600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2655158042907715, "created_at": "2025-06-03T08:00:20.625982+00:00"} {"global_step": 235201, "acc_step": 0, "speed/wps": 5514.48047379245, "speed/FLOPS": 243711811271842.47, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04640677571296692, "optim/lr": 1.3479455359058924e-05, "optim/total_tokens": 1973008990208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.270668625831604, "created_at": "2025-06-03T08:00:23.602491+00:00"} {"global_step": 235202, "acc_step": 0, "speed/wps": 5521.4282346433265, "speed/FLOPS": 244018866739587.44, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04684719815850258, "optim/lr": 1.34759081339646e-05, "optim/total_tokens": 1973017378816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.267845869064331, "created_at": "2025-06-03T08:00:26.574826+00:00"} {"global_step": 235203, "acc_step": 0, "speed/wps": 5516.826699584349, "speed/FLOPS": 243815502442772.16, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047837384045124054, "optim/lr": 1.3472360908870051e-05, "optim/total_tokens": 1973025767424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2567336559295654, "created_at": "2025-06-03T08:00:29.552233+00:00"} {"global_step": 235204, "acc_step": 0, "speed/wps": 5511.504117778794, "speed/FLOPS": 243580271570410.0, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05165480449795723, "optim/lr": 1.3468813683775505e-05, "optim/total_tokens": 1973034156032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2606284618377686, "created_at": "2025-06-03T08:00:32.533485+00:00"} {"global_step": 235205, "acc_step": 0, "speed/wps": 5510.94606054225, "speed/FLOPS": 243555608296950.62, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.13 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.13, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046341508626937866, "optim/lr": 1.3465266458680958e-05, "optim/total_tokens": 1973042544640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2644377946853638, "created_at": "2025-06-03T08:00:35.511289+00:00"} {"global_step": 235206, "acc_step": 0, "speed/wps": 5531.883830272255, "speed/FLOPS": 244480950549796.25, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.052900731563568115, "optim/lr": 1.3461719233586634e-05, "optim/total_tokens": 1973050933248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2790415287017822, "created_at": "2025-06-03T08:00:38.481356+00:00"} {"global_step": 235207, "acc_step": 0, "speed/wps": 5527.68996598212, "speed/FLOPS": 244295603214315.66, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04686720669269562, "optim/lr": 1.3458172008492087e-05, "optim/total_tokens": 1973059321856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2644919157028198, "created_at": "2025-06-03T08:00:41.450151+00:00"} {"global_step": 235208, "acc_step": 0, "speed/wps": 5533.182620912775, "speed/FLOPS": 244538350448294.1, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04763149097561836, "optim/lr": 1.345462478339754e-05, "optim/total_tokens": 1973067710464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2753055095672607, "created_at": "2025-06-03T08:00:44.415503+00:00"} {"global_step": 235209, "acc_step": 0, "speed/wps": 5518.987628815755, "speed/FLOPS": 243911004454161.8, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045647624880075455, "optim/lr": 1.3451077558302993e-05, "optim/total_tokens": 1973076099072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2580764293670654, "created_at": "2025-06-03T08:00:47.389340+00:00"} {"global_step": 235210, "acc_step": 0, "speed/wps": 5518.787814431487, "speed/FLOPS": 243902173681119.94, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047574225813150406, "optim/lr": 1.3447530333208668e-05, "optim/total_tokens": 1973084487680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2639473676681519, "created_at": "2025-06-03T08:00:50.362702+00:00"} {"global_step": 235211, "acc_step": 0, "speed/wps": 5518.962469863271, "speed/FLOPS": 243909892557237.22, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04617830738425255, "optim/lr": 1.3443983108114122e-05, "optim/total_tokens": 1973092876288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2615028619766235, "created_at": "2025-06-03T08:00:53.336111+00:00"} {"global_step": 235212, "acc_step": 0, "speed/wps": 5515.63303639471, "speed/FLOPS": 243762748639512.2, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04597872123122215, "optim/lr": 1.3440435883019576e-05, "optim/total_tokens": 1973101264896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2777328491210938, "created_at": "2025-06-03T08:00:56.315091+00:00"} {"global_step": 235213, "acc_step": 0, "speed/wps": 5519.155749175021, "speed/FLOPS": 243918434513523.38, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04683852940797806, "optim/lr": 1.3436888657925028e-05, "optim/total_tokens": 1973109653504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2603378295898438, "created_at": "2025-06-03T08:00:59.288531+00:00"} {"global_step": 235214, "acc_step": 0, "speed/wps": 5519.646107571112, "speed/FLOPS": 243940105844748.8, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045897360891103745, "optim/lr": 1.3433341432830703e-05, "optim/total_tokens": 1973118042112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2560827732086182, "created_at": "2025-06-03T08:01:02.261691+00:00"} {"global_step": 235215, "acc_step": 0, "speed/wps": 5530.393773483271, "speed/FLOPS": 244415097666525.16, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04512811452150345, "optim/lr": 1.3429794207736157e-05, "optim/total_tokens": 1973126430720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2816601991653442, "created_at": "2025-06-03T08:01:05.231351+00:00"} {"global_step": 235216, "acc_step": 0, "speed/wps": 5522.220651558044, "speed/FLOPS": 244053887511260.47, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0468834787607193, "optim/lr": 1.342624698264161e-05, "optim/total_tokens": 1973134819328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2813224792480469, "created_at": "2025-06-03T08:01:08.203030+00:00"} {"global_step": 235217, "acc_step": 0, "speed/wps": 5527.088816102102, "speed/FLOPS": 244269035466582.9, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.62, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045665208250284195, "optim/lr": 1.3422699757547064e-05, "optim/total_tokens": 1973143207936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2631566524505615, "created_at": "2025-06-03T08:01:11.176839+00:00"} {"global_step": 235218, "acc_step": 0, "speed/wps": 5528.086055643306, "speed/FLOPS": 244313108349969.44, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04582367464900017, "optim/lr": 1.3419152532452738e-05, "optim/total_tokens": 1973151596544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2627617120742798, "created_at": "2025-06-03T08:01:14.148872+00:00"} {"global_step": 235219, "acc_step": 0, "speed/wps": 5511.854163542121, "speed/FLOPS": 243595741801452.4, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04634576663374901, "optim/lr": 1.3415605307358191e-05, "optim/total_tokens": 1973159985152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2925845384597778, "created_at": "2025-06-03T08:01:17.129206+00:00"} {"global_step": 235220, "acc_step": 0, "speed/wps": 5522.156607923757, "speed/FLOPS": 244051057110430.06, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04614598676562309, "optim/lr": 1.3412058082263645e-05, "optim/total_tokens": 1973168373760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2696908712387085, "created_at": "2025-06-03T08:01:20.102192+00:00"} {"global_step": 235221, "acc_step": 0, "speed/wps": 5524.769251206404, "speed/FLOPS": 244166522570802.47, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045669641345739365, "optim/lr": 1.3408510857169099e-05, "optim/total_tokens": 1973176762368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2640926837921143, "created_at": "2025-06-03T08:01:23.072428+00:00"} {"global_step": 235222, "acc_step": 0, "speed/wps": 5512.381729199931, "speed/FLOPS": 243619057503201.78, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.12 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.12, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04613153263926506, "optim/lr": 1.3404963632074774e-05, "optim/total_tokens": 1973185150976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2740565538406372, "created_at": "2025-06-03T08:01:26.050046+00:00"} {"global_step": 235223, "acc_step": 0, "speed/wps": 5525.360447718181, "speed/FLOPS": 244192650430604.9, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045645687729120255, "optim/lr": 1.3401416406980228e-05, "optim/total_tokens": 1973193539584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2728331089019775, "created_at": "2025-06-03T08:01:29.019957+00:00"} {"global_step": 235224, "acc_step": 0, "speed/wps": 5533.674274900903, "speed/FLOPS": 244560079038056.1, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04681345820426941, "optim/lr": 1.339786918188568e-05, "optim/total_tokens": 1973201928192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2823116779327393, "created_at": "2025-06-03T08:01:31.987811+00:00"} {"global_step": 235225, "acc_step": 0, "speed/wps": 5527.959820724226, "speed/FLOPS": 244307529412674.97, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046983975917100906, "optim/lr": 1.3394321956791355e-05, "optim/total_tokens": 1973210316800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2706313133239746, "created_at": "2025-06-03T08:01:34.956145+00:00"} {"global_step": 235226, "acc_step": 0, "speed/wps": 5517.486539018213, "speed/FLOPS": 243844663968384.56, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04630853235721588, "optim/lr": 1.3390774731696809e-05, "optim/total_tokens": 1973218705408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2781168222427368, "created_at": "2025-06-03T08:01:37.930615+00:00"} {"global_step": 235227, "acc_step": 0, "speed/wps": 5525.869742988136, "speed/FLOPS": 244215158674727.44, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04719962179660797, "optim/lr": 1.3387227506602262e-05, "optim/total_tokens": 1973227094016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2718777656555176, "created_at": "2025-06-03T08:01:40.900703+00:00"} {"global_step": 235228, "acc_step": 0, "speed/wps": 5529.584967106918, "speed/FLOPS": 244379352564536.72, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0474158376455307, "optim/lr": 1.3383680281507716e-05, "optim/total_tokens": 1973235482624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2843295335769653, "created_at": "2025-06-03T08:01:43.872778+00:00"} {"global_step": 235229, "acc_step": 0, "speed/wps": 5531.36916225359, "speed/FLOPS": 244458204857680.97, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0471937358379364, "optim/lr": 1.338013305641339e-05, "optim/total_tokens": 1973243871232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2646706104278564, "created_at": "2025-06-03T08:01:46.840193+00:00"} {"global_step": 235230, "acc_step": 0, "speed/wps": 5514.233893855832, "speed/FLOPS": 243700913700754.5, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.11 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.11, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048323359340429306, "optim/lr": 1.3376585831318843e-05, "optim/total_tokens": 1973252259840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2646937370300293, "created_at": "2025-06-03T08:01:49.816280+00:00"} {"global_step": 235231, "acc_step": 0, "speed/wps": 5529.372938626634, "speed/FLOPS": 244369981990968.28, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046319372951984406, "optim/lr": 1.3373038606224297e-05, "optim/total_tokens": 1973260648448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2536664009094238, "created_at": "2025-06-03T08:01:52.787682+00:00"} {"global_step": 235232, "acc_step": 0, "speed/wps": 5530.616836291101, "speed/FLOPS": 244424955900892.3, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047192640602588654, "optim/lr": 1.336949138112975e-05, "optim/total_tokens": 1973269037056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2685109376907349, "created_at": "2025-06-03T08:01:55.758024+00:00"} {"global_step": 235233, "acc_step": 0, "speed/wps": 5525.681105384978, "speed/FLOPS": 244206821858202.62, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046193890273571014, "optim/lr": 1.3365944156035426e-05, "optim/total_tokens": 1973277425664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.263192892074585, "created_at": "2025-06-03T08:01:58.731700+00:00"} {"global_step": 235234, "acc_step": 0, "speed/wps": 5524.635651029958, "speed/FLOPS": 244160618126831.25, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.050504349172115326, "optim/lr": 1.3362396930940878e-05, "optim/total_tokens": 1973285814272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2764182090759277, "created_at": "2025-06-03T08:02:01.706261+00:00"} {"global_step": 235235, "acc_step": 0, "speed/wps": 5522.296463536457, "speed/FLOPS": 244057238012665.47, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04586341977119446, "optim/lr": 1.3358849705846332e-05, "optim/total_tokens": 1973294202880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2681057453155518, "created_at": "2025-06-03T08:02:04.678787+00:00"} {"global_step": 235236, "acc_step": 0, "speed/wps": 5525.684044206023, "speed/FLOPS": 244206951739050.56, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.059358444064855576, "optim/lr": 1.3355302480751785e-05, "optim/total_tokens": 1973302591488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2769582271575928, "created_at": "2025-06-03T08:02:07.648081+00:00"} {"global_step": 235237, "acc_step": 0, "speed/wps": 5516.622895875353, "speed/FLOPS": 243806495361996.47, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04626380652189255, "optim/lr": 1.335175525565746e-05, "optim/total_tokens": 1973310980096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2620617151260376, "created_at": "2025-06-03T08:02:10.622571+00:00"} {"global_step": 235238, "acc_step": 0, "speed/wps": 5525.180425033573, "speed/FLOPS": 244184694349384.88, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05804163217544556, "optim/lr": 1.3348208030562914e-05, "optim/total_tokens": 1973319368704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2647606134414673, "created_at": "2025-06-03T08:02:13.594206+00:00"} {"global_step": 235239, "acc_step": 0, "speed/wps": 5506.465747189074, "speed/FLOPS": 243357601379062.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04858586564660072, "optim/lr": 1.3344660805468366e-05, "optim/total_tokens": 1973327757312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2684496641159058, "created_at": "2025-06-03T08:02:16.577644+00:00"} {"global_step": 235240, "acc_step": 0, "speed/wps": 5527.175832276158, "speed/FLOPS": 244272881136087.0, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05111193656921387, "optim/lr": 1.334111358037382e-05, "optim/total_tokens": 1973336145920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.265467643737793, "created_at": "2025-06-03T08:02:19.546728+00:00"} {"global_step": 235241, "acc_step": 0, "speed/wps": 5528.154959794948, "speed/FLOPS": 244316153560788.56, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05129639804363251, "optim/lr": 1.3337566355279495e-05, "optim/total_tokens": 1973344534528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2804099321365356, "created_at": "2025-06-03T08:02:22.514965+00:00"} {"global_step": 235242, "acc_step": 0, "speed/wps": 5532.24463460681, "speed/FLOPS": 244496896254619.56, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04575596749782562, "optim/lr": 1.3334019130184949e-05, "optim/total_tokens": 1973352923136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2796783447265625, "created_at": "2025-06-03T08:02:25.483752+00:00"} {"global_step": 235243, "acc_step": 0, "speed/wps": 5520.402750623546, "speed/FLOPS": 243973545594816.16, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.061891667544841766, "optim/lr": 1.3330471905090403e-05, "optim/total_tokens": 1973361311744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2620279788970947, "created_at": "2025-06-03T08:02:28.459567+00:00"} {"global_step": 235244, "acc_step": 0, "speed/wps": 5537.800516242756, "speed/FLOPS": 244742437785348.25, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046361297369003296, "optim/lr": 1.3326924679995855e-05, "optim/total_tokens": 1973369700352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2674534320831299, "created_at": "2025-06-03T08:02:31.423268+00:00"} {"global_step": 235245, "acc_step": 0, "speed/wps": 5522.688061747088, "speed/FLOPS": 244074544649194.0, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05239809677004814, "optim/lr": 1.332337745490153e-05, "optim/total_tokens": 1973378088960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2566858530044556, "created_at": "2025-06-03T08:02:34.394904+00:00"} {"global_step": 235246, "acc_step": 0, "speed/wps": 5516.339880712221, "speed/FLOPS": 243793987540389.0, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04677177593111992, "optim/lr": 1.3319830229806984e-05, "optim/total_tokens": 1973386477568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2629259824752808, "created_at": "2025-06-03T08:02:37.369426+00:00"} {"global_step": 235247, "acc_step": 0, "speed/wps": 5517.71416422334, "speed/FLOPS": 243854723837359.75, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05028745159506798, "optim/lr": 1.3316283004712437e-05, "optim/total_tokens": 1973394866176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2666645050048828, "created_at": "2025-06-03T08:02:40.346630+00:00"} {"global_step": 235248, "acc_step": 0, "speed/wps": 5512.811059027204, "speed/FLOPS": 243638031684057.97, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.1 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.1, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.06389732658863068, "optim/lr": 1.3312735779617891e-05, "optim/total_tokens": 1973403254784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.271181583404541, "created_at": "2025-06-03T08:02:43.327461+00:00"} {"global_step": 235249, "acc_step": 0, "speed/wps": 5531.31724636553, "speed/FLOPS": 244455910441158.34, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04618864506483078, "optim/lr": 1.3309188554523566e-05, "optim/total_tokens": 1973411643392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2585088014602661, "created_at": "2025-06-03T08:02:46.294195+00:00"} {"global_step": 235250, "acc_step": 0, "speed/wps": 5533.137035232058, "speed/FLOPS": 244536335794535.06, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045800697058439255, "optim/lr": 1.3305641329429018e-05, "optim/total_tokens": 1973420032000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2766788005828857, "created_at": "2025-06-03T08:02:49.260270+00:00"} {"global_step": 235251, "acc_step": 0, "speed/wps": 5529.381753849557, "speed/FLOPS": 244370371578701.06, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046303726732730865, "optim/lr": 1.3302094104334472e-05, "optim/total_tokens": 1973428420608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2499816417694092, "created_at": "2025-06-03T08:02:52.232311+00:00"} {"global_step": 235252, "acc_step": 0, "speed/wps": 5529.698001672014, "speed/FLOPS": 244384348113750.56, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045333392918109894, "optim/lr": 1.3298546879240148e-05, "optim/total_tokens": 1973436809216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2637370824813843, "created_at": "2025-06-03T08:02:55.205046+00:00"} {"global_step": 235253, "acc_step": 0, "speed/wps": 5519.852186214643, "speed/FLOPS": 243949213465986.75, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04638345539569855, "optim/lr": 1.3294999654145601e-05, "optim/total_tokens": 1973445197824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2727510929107666, "created_at": "2025-06-03T08:02:58.179896+00:00"} {"global_step": 235254, "acc_step": 0, "speed/wps": 5530.133637334482, "speed/FLOPS": 244403600980246.22, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0463288240134716, "optim/lr": 1.3291452429051055e-05, "optim/total_tokens": 1973453586432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.274721622467041, "created_at": "2025-06-03T08:03:01.147645+00:00"} {"global_step": 235255, "acc_step": 0, "speed/wps": 5517.560563669052, "speed/FLOPS": 243847935479059.12, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047071442008018494, "optim/lr": 1.3287905203956507e-05, "optim/total_tokens": 1973461975040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2629444599151611, "created_at": "2025-06-03T08:03:04.121816+00:00"} {"global_step": 235256, "acc_step": 0, "speed/wps": 5517.048969904925, "speed/FLOPS": 243825325653259.0, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04627739638090134, "optim/lr": 1.3284357978862182e-05, "optim/total_tokens": 1973470363648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.264768362045288, "created_at": "2025-06-03T08:03:07.096206+00:00"} {"global_step": 235257, "acc_step": 0, "speed/wps": 5520.283948961203, "speed/FLOPS": 243968295169422.66, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0465194396674633, "optim/lr": 1.3280810753767636e-05, "optim/total_tokens": 1973478752256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2811195850372314, "created_at": "2025-06-03T08:03:10.069981+00:00"} {"global_step": 235258, "acc_step": 0, "speed/wps": 5525.450627027184, "speed/FLOPS": 244196635894483.3, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04685472324490547, "optim/lr": 1.327726352867309e-05, "optim/total_tokens": 1973487140864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.274363398551941, "created_at": "2025-06-03T08:03:13.040303+00:00"} {"global_step": 235259, "acc_step": 0, "speed/wps": 5524.355575873055, "speed/FLOPS": 244148240238450.75, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.06650122255086899, "optim/lr": 1.3273716303578543e-05, "optim/total_tokens": 1973495529472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2606837749481201, "created_at": "2025-06-03T08:03:16.014315+00:00"} {"global_step": 235260, "acc_step": 0, "speed/wps": 5525.187857742531, "speed/FLOPS": 244185022837076.78, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04716658592224121, "optim/lr": 1.3270169078484219e-05, "optim/total_tokens": 1973503918080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.278403878211975, "created_at": "2025-06-03T08:03:18.987525+00:00"} {"global_step": 235261, "acc_step": 0, "speed/wps": 5520.913439294577, "speed/FLOPS": 243996115420134.16, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046229038387537, "optim/lr": 1.326662185338967e-05, "optim/total_tokens": 1973512306688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2731468677520752, "created_at": "2025-06-03T08:03:21.960007+00:00"} {"global_step": 235262, "acc_step": 0, "speed/wps": 5511.2538022086055, "speed/FLOPS": 243569208903438.9, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.09 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.09, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04592350870370865, "optim/lr": 1.3263074628295124e-05, "optim/total_tokens": 1973520695296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2669458389282227, "created_at": "2025-06-03T08:03:24.940053+00:00"} {"global_step": 235263, "acc_step": 0, "speed/wps": 5519.818730792524, "speed/FLOPS": 243947734907569.47, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04592747613787651, "optim/lr": 1.3259527403200578e-05, "optim/total_tokens": 1973529083904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2516056299209595, "created_at": "2025-06-03T08:03:27.917528+00:00"} {"global_step": 235264, "acc_step": 0, "speed/wps": 5519.453813018659, "speed/FLOPS": 243931607409783.16, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04662005230784416, "optim/lr": 1.3255980178106253e-05, "optim/total_tokens": 1973537472512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.262191653251648, "created_at": "2025-06-03T08:03:30.892834+00:00"} {"global_step": 235265, "acc_step": 0, "speed/wps": 5517.849567250416, "speed/FLOPS": 243860707958101.0, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04594958573579788, "optim/lr": 1.3252432953011707e-05, "optim/total_tokens": 1973545861120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2709308862686157, "created_at": "2025-06-03T08:03:33.870656+00:00"} {"global_step": 235266, "acc_step": 0, "speed/wps": 5544.338065519987, "speed/FLOPS": 245031364001191.25, "speed/curr_iter_time": 2.9528, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9528, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 192.97, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04614071547985077, "optim/lr": 1.3248885727917159e-05, "optim/total_tokens": 1973554249728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.266512393951416, "created_at": "2025-06-03T08:03:36.830536+00:00"} {"global_step": 235267, "acc_step": 0, "speed/wps": 5533.051417924879, "speed/FLOPS": 244532551947786.88, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045784518122673035, "optim/lr": 1.3245338502822612e-05, "optim/total_tokens": 1973562638336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2647383213043213, "created_at": "2025-06-03T08:03:39.798555+00:00"} {"global_step": 235268, "acc_step": 0, "speed/wps": 5534.367334927023, "speed/FLOPS": 244590708743807.8, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046877339482307434, "optim/lr": 1.3241791277728288e-05, "optim/total_tokens": 1973571026944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2675776481628418, "created_at": "2025-06-03T08:03:42.763552+00:00"} {"global_step": 235269, "acc_step": 0, "speed/wps": 5524.551508872475, "speed/FLOPS": 244156899474149.1, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04607657343149185, "optim/lr": 1.3238244052633741e-05, "optim/total_tokens": 1973579415552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2700104713439941, "created_at": "2025-06-03T08:03:45.740028+00:00"} {"global_step": 235270, "acc_step": 0, "speed/wps": 5534.287826204762, "speed/FLOPS": 244587194865246.4, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04579626023769379, "optim/lr": 1.3234696827539195e-05, "optim/total_tokens": 1973587804160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2704781293869019, "created_at": "2025-06-03T08:03:48.705294+00:00"} {"global_step": 235271, "acc_step": 0, "speed/wps": 5516.45251106951, "speed/FLOPS": 243798965225686.75, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046685636043548584, "optim/lr": 1.3231149602444647e-05, "optim/total_tokens": 1973596192768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.273065209388733, "created_at": "2025-06-03T08:03:51.679896+00:00"} {"global_step": 235272, "acc_step": 0, "speed/wps": 5514.583723788443, "speed/FLOPS": 243716374393184.0, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.08 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.08, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04596316069364548, "optim/lr": 1.3227602377350322e-05, "optim/total_tokens": 1973604581376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2756332159042358, "created_at": "2025-06-03T08:03:54.657956+00:00"} {"global_step": 235273, "acc_step": 0, "speed/wps": 5518.7636281079085, "speed/FLOPS": 243901104769414.56, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0478970967233181, "optim/lr": 1.3224055152255776e-05, "optim/total_tokens": 1973612969984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.268621802330017, "created_at": "2025-06-03T08:03:57.631184+00:00"} {"global_step": 235274, "acc_step": 0, "speed/wps": 5530.091015836588, "speed/FLOPS": 244401717328195.9, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046594541519880295, "optim/lr": 1.322050792716123e-05, "optim/total_tokens": 1973621358592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.271437168121338, "created_at": "2025-06-03T08:04:00.601805+00:00"} {"global_step": 235275, "acc_step": 0, "speed/wps": 5515.126259043639, "speed/FLOPS": 243740351674516.47, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045693933963775635, "optim/lr": 1.3216960702066683e-05, "optim/total_tokens": 1973629747200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2755746841430664, "created_at": "2025-06-03T08:04:03.579777+00:00"} {"global_step": 235276, "acc_step": 0, "speed/wps": 5531.13567929407, "speed/FLOPS": 244447886105944.28, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04837033897638321, "optim/lr": 1.3213413476972357e-05, "optim/total_tokens": 1973638135808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2577427625656128, "created_at": "2025-06-03T08:04:06.546652+00:00"} {"global_step": 235277, "acc_step": 0, "speed/wps": 5521.254957533834, "speed/FLOPS": 244011208778260.53, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046925608068704605, "optim/lr": 1.320986625187781e-05, "optim/total_tokens": 1973646524416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.25511634349823, "created_at": "2025-06-03T08:04:09.518434+00:00"} {"global_step": 235278, "acc_step": 0, "speed/wps": 5533.49480746732, "speed/FLOPS": 244552147496089.34, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048888806253671646, "optim/lr": 1.3206319026783264e-05, "optim/total_tokens": 1973654913024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2768430709838867, "created_at": "2025-06-03T08:04:12.483939+00:00"} {"global_step": 235279, "acc_step": 0, "speed/wps": 5509.9484771068755, "speed/FLOPS": 243511520215201.97, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048097871243953705, "optim/lr": 1.320277180168894e-05, "optim/total_tokens": 1973663301632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2665083408355713, "created_at": "2025-06-03T08:04:15.461792+00:00"} {"global_step": 235280, "acc_step": 0, "speed/wps": 5520.776609850333, "speed/FLOPS": 243990068259055.2, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047531433403491974, "optim/lr": 1.3199224576594393e-05, "optim/total_tokens": 1973671690240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2702927589416504, "created_at": "2025-06-03T08:04:18.437288+00:00"} {"global_step": 235281, "acc_step": 0, "speed/wps": 5525.8804559173905, "speed/FLOPS": 244215632131366.75, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04740377515554428, "optim/lr": 1.3195677351499847e-05, "optim/total_tokens": 1973680078848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2680408954620361, "created_at": "2025-06-03T08:04:21.407972+00:00"} {"global_step": 235282, "acc_step": 0, "speed/wps": 5533.514697774776, "speed/FLOPS": 244553026545871.1, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04808175936341286, "optim/lr": 1.3192130126405299e-05, "optim/total_tokens": 1973688467456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.279296636581421, "created_at": "2025-06-03T08:04:24.373560+00:00"} {"global_step": 235283, "acc_step": 0, "speed/wps": 5522.630126332283, "speed/FLOPS": 244071984200399.97, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04605437070131302, "optim/lr": 1.3188582901310975e-05, "optim/total_tokens": 1973696856064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2616692781448364, "created_at": "2025-06-03T08:04:27.345023+00:00"} {"global_step": 235284, "acc_step": 0, "speed/wps": 5524.165696406016, "speed/FLOPS": 244139848537898.8, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04922206327319145, "optim/lr": 1.3185035676216428e-05, "optim/total_tokens": 1973705244672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.267910361289978, "created_at": "2025-06-03T08:04:30.318883+00:00"} {"global_step": 235285, "acc_step": 0, "speed/wps": 5513.489607022438, "speed/FLOPS": 243668020032323.8, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.07 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.07, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04632732272148132, "optim/lr": 1.3181488451121882e-05, "optim/total_tokens": 1973713633280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2756338119506836, "created_at": "2025-06-03T08:04:33.298680+00:00"} {"global_step": 235286, "acc_step": 0, "speed/wps": 5515.603655705135, "speed/FLOPS": 243761450163416.97, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04568890854716301, "optim/lr": 1.3177941226027335e-05, "optim/total_tokens": 1973722021888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2730220556259155, "created_at": "2025-06-03T08:04:36.275108+00:00"} {"global_step": 235287, "acc_step": 0, "speed/wps": 5511.716627510088, "speed/FLOPS": 243589663412809.78, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04930877313017845, "optim/lr": 1.317439400093301e-05, "optim/total_tokens": 1973730410496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2744109630584717, "created_at": "2025-06-03T08:04:39.253997+00:00"} {"global_step": 235288, "acc_step": 0, "speed/wps": 5514.442506233868, "speed/FLOPS": 243710133300088.72, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04662520810961723, "optim/lr": 1.3170846775838463e-05, "optim/total_tokens": 1973738799104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2761300802230835, "created_at": "2025-06-03T08:04:42.230999+00:00"} {"global_step": 235289, "acc_step": 0, "speed/wps": 5519.845080470233, "speed/FLOPS": 243948899428454.34, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04818055033683777, "optim/lr": 1.3167299550743916e-05, "optim/total_tokens": 1973747187712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.269380807876587, "created_at": "2025-06-03T08:04:45.203611+00:00"} {"global_step": 235290, "acc_step": 0, "speed/wps": 5531.903692474528, "speed/FLOPS": 244481828357472.72, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05295996740460396, "optim/lr": 1.316375232564937e-05, "optim/total_tokens": 1973755576320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2683765888214111, "created_at": "2025-06-03T08:04:48.170664+00:00"} {"global_step": 235291, "acc_step": 0, "speed/wps": 5527.044354420588, "speed/FLOPS": 244267070487835.5, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04866720363497734, "optim/lr": 1.3160205100555046e-05, "optim/total_tokens": 1973763964928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2802908420562744, "created_at": "2025-06-03T08:04:51.144140+00:00"} {"global_step": 235292, "acc_step": 0, "speed/wps": 5533.078058545167, "speed/FLOPS": 244533729326844.5, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05159711465239525, "optim/lr": 1.3156657875460497e-05, "optim/total_tokens": 1973772353536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.25687837600708, "created_at": "2025-06-03T08:04:54.112640+00:00"} {"global_step": 235293, "acc_step": 0, "speed/wps": 5520.4009984082495, "speed/FLOPS": 243973468155868.72, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.84, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046289294958114624, "optim/lr": 1.3153110650365951e-05, "optim/total_tokens": 1973780742144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.270288348197937, "created_at": "2025-06-03T08:04:57.091393+00:00"} {"global_step": 235294, "acc_step": 0, "speed/wps": 5517.080195690775, "speed/FLOPS": 243826705673165.5, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05122655630111694, "optim/lr": 1.3149563425271405e-05, "optim/total_tokens": 1973789130752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.261782169342041, "created_at": "2025-06-03T08:05:00.066414+00:00"} {"global_step": 235295, "acc_step": 0, "speed/wps": 5513.670219162609, "speed/FLOPS": 243676002164462.66, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.06 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.06, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04965662583708763, "optim/lr": 1.314601620017708e-05, "optim/total_tokens": 1973797519360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2790586948394775, "created_at": "2025-06-03T08:05:03.042882+00:00"} {"global_step": 235296, "acc_step": 0, "speed/wps": 5516.71129679235, "speed/FLOPS": 243810402230050.88, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.050391849130392075, "optim/lr": 1.3142468975082534e-05, "optim/total_tokens": 1973805907968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.2738038301467896, "created_at": "2025-06-03T08:05:06.017398+00:00"} {"global_step": 235297, "acc_step": 0, "speed/wps": 5519.263592010202, "speed/FLOPS": 243923200614848.72, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05916326493024826, "optim/lr": 1.3138921749987986e-05, "optim/total_tokens": 1973814296576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2782602310180664, "created_at": "2025-06-03T08:05:08.991023+00:00"} {"global_step": 235298, "acc_step": 0, "speed/wps": 5528.676617439442, "speed/FLOPS": 244339208158589.34, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046159710735082626, "optim/lr": 1.313537452489344e-05, "optim/total_tokens": 1973822685184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2531789541244507, "created_at": "2025-06-03T08:05:11.959946+00:00"} {"global_step": 235299, "acc_step": 0, "speed/wps": 5525.077144855259, "speed/FLOPS": 244180129894139.28, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.76, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.06027405709028244, "optim/lr": 1.3131827299799115e-05, "optim/total_tokens": 1973831073792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2698314189910889, "created_at": "2025-06-03T08:05:14.929692+00:00"} {"global_step": 235300, "acc_step": 0, "speed/wps": 5519.398210023765, "speed/FLOPS": 243929150042010.75, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04997972771525383, "optim/lr": 1.3128280074704568e-05, "optim/total_tokens": 1973839462400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.263107180595398, "created_at": "2025-06-03T08:05:17.906520+00:00"} {"global_step": 235301, "acc_step": 0, "speed/wps": 5526.104586014682, "speed/FLOPS": 244225537534465.22, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.054731402546167374, "optim/lr": 1.3124732849610022e-05, "optim/total_tokens": 1973847851008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.260271668434143, "created_at": "2025-06-03T08:05:20.876661+00:00"} {"global_step": 235302, "acc_step": 0, "speed/wps": 5524.371136858827, "speed/FLOPS": 244148927954373.53, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05486763268709183, "optim/lr": 1.3121185624515476e-05, "optim/total_tokens": 1973856239616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.286683201789856, "created_at": "2025-06-03T08:05:23.847865+00:00"} {"global_step": 235303, "acc_step": 0, "speed/wps": 5526.858900948057, "speed/FLOPS": 244258874393586.56, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 193.62, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04705047234892845, "optim/lr": 1.311763839942115e-05, "optim/total_tokens": 1973864628224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2577059268951416, "created_at": "2025-06-03T08:05:26.816787+00:00"} {"global_step": 235304, "acc_step": 0, "speed/wps": 5528.410085702425, "speed/FLOPS": 244327428820046.28, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.053733356297016144, "optim/lr": 1.3114091174326603e-05, "optim/total_tokens": 1973873016832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2561711072921753, "created_at": "2025-06-03T08:05:29.788255+00:00"} {"global_step": 235305, "acc_step": 0, "speed/wps": 5519.457280748019, "speed/FLOPS": 243931760665671.4, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.05 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.05, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04908980056643486, "optim/lr": 1.3110543949232057e-05, "optim/total_tokens": 1973881405440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.26065194606781, "created_at": "2025-06-03T08:05:32.761381+00:00"} {"global_step": 235306, "acc_step": 0, "speed/wps": 5526.138285191055, "speed/FLOPS": 244227026865572.84, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04586750268936157, "optim/lr": 1.3106996724137732e-05, "optim/total_tokens": 1973889794048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2711060047149658, "created_at": "2025-06-03T08:05:35.733311+00:00"} {"global_step": 235307, "acc_step": 0, "speed/wps": 5536.989407513878, "speed/FLOPS": 244706590931162.7, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0583704337477684, "optim/lr": 1.3103449499043186e-05, "optim/total_tokens": 1973898182656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2795839309692383, "created_at": "2025-06-03T08:05:38.700349+00:00"} {"global_step": 235308, "acc_step": 0, "speed/wps": 5533.909514567075, "speed/FLOPS": 244570475427235.16, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04559272527694702, "optim/lr": 1.3099902273948638e-05, "optim/total_tokens": 1973906571264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.278433918952942, "created_at": "2025-06-03T08:05:41.668745+00:00"} {"global_step": 235309, "acc_step": 0, "speed/wps": 5530.055635246779, "speed/FLOPS": 244400153687220.62, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04929322749376297, "optim/lr": 1.3096355048854091e-05, "optim/total_tokens": 1973914959872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2738906145095825, "created_at": "2025-06-03T08:05:44.636061+00:00"} {"global_step": 235310, "acc_step": 0, "speed/wps": 5529.711571310036, "speed/FLOPS": 244384947822295.44, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04753219708800316, "optim/lr": 1.3092807823759767e-05, "optim/total_tokens": 1973923348480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2670139074325562, "created_at": "2025-06-03T08:05:47.605205+00:00"} {"global_step": 235311, "acc_step": 0, "speed/wps": 5524.8641215650705, "speed/FLOPS": 244170715355065.0, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04573548957705498, "optim/lr": 1.308926059866522e-05, "optim/total_tokens": 1973931737088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2609400749206543, "created_at": "2025-06-03T08:05:50.579744+00:00"} {"global_step": 235312, "acc_step": 0, "speed/wps": 5518.992442129893, "speed/FLOPS": 243911217178009.94, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.049737706780433655, "optim/lr": 1.3085713373570674e-05, "optim/total_tokens": 1973940125696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.289310336112976, "created_at": "2025-06-03T08:05:53.556558+00:00"} {"global_step": 235313, "acc_step": 0, "speed/wps": 5532.015905963663, "speed/FLOPS": 244486787619331.78, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.46, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047828931361436844, "optim/lr": 1.3082166148476126e-05, "optim/total_tokens": 1973948514304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2671985626220703, "created_at": "2025-06-03T08:05:56.523795+00:00"} {"global_step": 235314, "acc_step": 0, "speed/wps": 5516.985291851668, "speed/FLOPS": 243822511409238.84, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05772504210472107, "optim/lr": 1.3078618923381802e-05, "optim/total_tokens": 1973956902912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2768203020095825, "created_at": "2025-06-03T08:05:59.500849+00:00"} {"global_step": 235315, "acc_step": 0, "speed/wps": 5529.754073543718, "speed/FLOPS": 244386826203478.03, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04706912115216255, "optim/lr": 1.3075071698287255e-05, "optim/total_tokens": 1973965291520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2626174688339233, "created_at": "2025-06-03T08:06:02.472288+00:00"} {"global_step": 235316, "acc_step": 0, "speed/wps": 5530.747839511085, "speed/FLOPS": 244430745572680.34, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04661580175161362, "optim/lr": 1.3071524473192709e-05, "optim/total_tokens": 1973973680128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2644641399383545, "created_at": "2025-06-03T08:06:05.442572+00:00"} {"global_step": 235317, "acc_step": 0, "speed/wps": 5535.430143413739, "speed/FLOPS": 244637679438973.7, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047423336654901505, "optim/lr": 1.3067977248098162e-05, "optim/total_tokens": 1973982068736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2646931409835815, "created_at": "2025-06-03T08:06:08.407674+00:00"} {"global_step": 235318, "acc_step": 0, "speed/wps": 5520.845193733292, "speed/FLOPS": 243993099315637.8, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04622270166873932, "optim/lr": 1.3064430023003838e-05, "optim/total_tokens": 1973990457344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2628260850906372, "created_at": "2025-06-03T08:06:11.383594+00:00"} {"global_step": 235319, "acc_step": 0, "speed/wps": 5530.499573171147, "speed/FLOPS": 244419773471197.4, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047118742018938065, "optim/lr": 1.306088279790929e-05, "optim/total_tokens": 1973998845952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.284606695175171, "created_at": "2025-06-03T08:06:14.353011+00:00"} {"global_step": 235320, "acc_step": 0, "speed/wps": 5533.639925014549, "speed/FLOPS": 244558560948897.9, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046169307082891464, "optim/lr": 1.3057335572814743e-05, "optim/total_tokens": 1974007234560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2683532238006592, "created_at": "2025-06-03T08:06:17.318861+00:00"} {"global_step": 235321, "acc_step": 0, "speed/wps": 5520.111882094927, "speed/FLOPS": 243960690694651.28, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04735441878437996, "optim/lr": 1.3053788347720197e-05, "optim/total_tokens": 1974015623168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2690080404281616, "created_at": "2025-06-03T08:06:20.291768+00:00"} {"global_step": 235322, "acc_step": 0, "speed/wps": 5524.273847441476, "speed/FLOPS": 244144628260099.0, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.81, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04834538325667381, "optim/lr": 1.3050241122625873e-05, "optim/total_tokens": 1974024011776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2599778175354004, "created_at": "2025-06-03T08:06:23.263711+00:00"} {"global_step": 235323, "acc_step": 0, "speed/wps": 5529.431742938672, "speed/FLOPS": 244372580840572.62, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04829536750912666, "optim/lr": 1.3046693897531326e-05, "optim/total_tokens": 1974032400384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2667940855026245, "created_at": "2025-06-03T08:06:26.231536+00:00"} {"global_step": 235324, "acc_step": 0, "speed/wps": 5527.959962727291, "speed/FLOPS": 244307535688483.6, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046412911266088486, "optim/lr": 1.3043146672436778e-05, "optim/total_tokens": 1974040788992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2812384366989136, "created_at": "2025-06-03T08:06:29.200026+00:00"} {"global_step": 235325, "acc_step": 0, "speed/wps": 5530.753558407496, "speed/FLOPS": 244430998318629.72, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.59, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04667279124259949, "optim/lr": 1.3039599447342232e-05, "optim/total_tokens": 1974049177600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2689088582992554, "created_at": "2025-06-03T08:06:32.172333+00:00"} {"global_step": 235326, "acc_step": 0, "speed/wps": 5519.740812886664, "speed/FLOPS": 243944291334950.44, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047147221863269806, "optim/lr": 1.3036052222247907e-05, "optim/total_tokens": 1974057566208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2542856931686401, "created_at": "2025-06-03T08:06:35.145678+00:00"} {"global_step": 235327, "acc_step": 0, "speed/wps": 5515.060325006557, "speed/FLOPS": 243737437727558.44, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046123407781124115, "optim/lr": 1.303250499715336e-05, "optim/total_tokens": 1974065954816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2819637060165405, "created_at": "2025-06-03T08:06:38.124652+00:00"} {"global_step": 235328, "acc_step": 0, "speed/wps": 5518.424845361379, "speed/FLOPS": 243886132306065.28, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04568417742848396, "optim/lr": 1.3028957772058814e-05, "optim/total_tokens": 1974074343424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2679303884506226, "created_at": "2025-06-03T08:06:41.098127+00:00"} {"global_step": 235329, "acc_step": 0, "speed/wps": 5513.640288690789, "speed/FLOPS": 243674679390806.25, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048713892698287964, "optim/lr": 1.3025410546964266e-05, "optim/total_tokens": 1974082732032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2721309661865234, "created_at": "2025-06-03T08:06:44.076929+00:00"} {"global_step": 235330, "acc_step": 0, "speed/wps": 5512.169759721626, "speed/FLOPS": 243609689537218.84, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.03 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.03, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04706387594342232, "optim/lr": 1.3021863321869942e-05, "optim/total_tokens": 1974091120640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2642946243286133, "created_at": "2025-06-03T08:06:47.057565+00:00"} {"global_step": 235331, "acc_step": 0, "speed/wps": 5496.9212870520305, "speed/FLOPS": 242935785093981.12, "speed/curr_iter_time": 2.9797, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9797, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "3.04 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 3.04, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04540514200925827, "optim/lr": 1.3018316096775395e-05, "optim/total_tokens": 1974099509248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.263952612876892, "created_at": "2025-06-03T08:06:50.046684+00:00"} {"global_step": 235332, "acc_step": 0, "speed/wps": 5535.614405009875, "speed/FLOPS": 244645822858386.53, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 193.42, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045596856623888016, "optim/lr": 1.3014768871680849e-05, "optim/total_tokens": 1974107897856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.264893651008606, "created_at": "2025-06-03T08:06:53.010541+00:00"} {"global_step": 235333, "acc_step": 0, "speed/wps": 5524.737157999052, "speed/FLOPS": 244165104215305.44, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04645223170518875, "optim/lr": 1.3011221646586525e-05, "optim/total_tokens": 1974116286464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.267695665359497, "created_at": "2025-06-03T08:06:55.985215+00:00"} {"global_step": 235334, "acc_step": 0, "speed/wps": 5522.557076858778, "speed/FLOPS": 244068755787572.12, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04696381464600563, "optim/lr": 1.3007674421491976e-05, "optim/total_tokens": 1974124675072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.260365605354309, "created_at": "2025-06-03T08:06:58.958847+00:00"} {"global_step": 235335, "acc_step": 0, "speed/wps": 5524.687046859865, "speed/FLOPS": 244162889559445.44, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0460505411028862, "optim/lr": 1.300412719639743e-05, "optim/total_tokens": 1974133063680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2649027109146118, "created_at": "2025-06-03T08:07:01.929318+00:00"} {"global_step": 235336, "acc_step": 0, "speed/wps": 5530.261183280787, "speed/FLOPS": 244409237858233.56, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 193.62, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04670928046107292, "optim/lr": 1.3000579971302884e-05, "optim/total_tokens": 1974141452288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2683565616607666, "created_at": "2025-06-03T08:07:04.900128+00:00"} {"global_step": 235337, "acc_step": 0, "speed/wps": 5534.258336535665, "speed/FLOPS": 244585891572814.12, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 193.38, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045652516186237335, "optim/lr": 1.299703274620856e-05, "optim/total_tokens": 1974149840896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2673418521881104, "created_at": "2025-06-03T08:07:07.865887+00:00"} {"global_step": 235338, "acc_step": 0, "speed/wps": 5523.697175832218, "speed/FLOPS": 244119142326642.62, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04846687987446785, "optim/lr": 1.2993485521114013e-05, "optim/total_tokens": 1974158229504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2748310565948486, "created_at": "2025-06-03T08:07:10.837973+00:00"} {"global_step": 235339, "acc_step": 0, "speed/wps": 5519.765599651086, "speed/FLOPS": 243945386783067.75, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046070877462625504, "optim/lr": 1.2989938296019466e-05, "optim/total_tokens": 1974166618112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2774040699005127, "created_at": "2025-06-03T08:07:13.815762+00:00"} {"global_step": 235340, "acc_step": 0, "speed/wps": 5523.209604113926, "speed/FLOPS": 244097594152312.4, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.0471247136592865, "optim/lr": 1.2986391070924918e-05, "optim/total_tokens": 1974175006720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2669826745986938, "created_at": "2025-06-03T08:07:16.790063+00:00"} {"global_step": 235341, "acc_step": 0, "speed/wps": 5532.749656437555, "speed/FLOPS": 244519215634602.44, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04574240371584892, "optim/lr": 1.2982843845830594e-05, "optim/total_tokens": 1974183395328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2651809453964233, "created_at": "2025-06-03T08:07:19.758088+00:00"} {"global_step": 235342, "acc_step": 0, "speed/wps": 5527.460819679902, "speed/FLOPS": 244285476120634.72, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04653764143586159, "optim/lr": 1.2979296620736047e-05, "optim/total_tokens": 1974191783936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2742345333099365, "created_at": "2025-06-03T08:07:22.726757+00:00"} {"global_step": 235343, "acc_step": 0, "speed/wps": 5516.185450325091, "speed/FLOPS": 243787162507724.2, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.046934016048908234, "optim/lr": 1.2975749395641501e-05, "optim/total_tokens": 1974200172544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2733099460601807, "created_at": "2025-06-03T08:07:25.701719+00:00"} {"global_step": 235344, "acc_step": 0, "speed/wps": 5532.717104171011, "speed/FLOPS": 244517776991038.78, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.05287882685661316, "optim/lr": 1.2972202170546955e-05, "optim/total_tokens": 1974208561152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2427730560302734, "created_at": "2025-06-03T08:07:28.671049+00:00"} {"global_step": 235345, "acc_step": 0, "speed/wps": 5534.421099245894, "speed/FLOPS": 244593084851511.2, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.045719508081674576, "optim/lr": 1.2968654945452629e-05, "optim/total_tokens": 1974216949760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2546910047531128, "created_at": "2025-06-03T08:07:31.636130+00:00"} {"global_step": 235346, "acc_step": 0, "speed/wps": 5513.315245539081, "speed/FLOPS": 243660314147222.44, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04914826527237892, "optim/lr": 1.2965107720358082e-05, "optim/total_tokens": 1974225338368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2642911672592163, "created_at": "2025-06-03T08:07:34.612472+00:00"} {"global_step": 235347, "acc_step": 0, "speed/wps": 5498.275895413313, "speed/FLOPS": 242995651850035.72, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "3.02 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 3.02, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04892304912209511, "optim/lr": 1.2961560495263536e-05, "optim/total_tokens": 1974233726976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2825241088867188, "created_at": "2025-06-03T08:07:37.596768+00:00"} {"global_step": 235348, "acc_step": 0, "speed/wps": 5533.602087848767, "speed/FLOPS": 244556888739838.53, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.51, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.048268336802721024, "optim/lr": 1.295801327016899e-05, "optim/total_tokens": 1974242115584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2784109115600586, "created_at": "2025-06-03T08:07:40.562238+00:00"} {"global_step": 235349, "acc_step": 0, "speed/wps": 5517.0811282740515, "speed/FLOPS": 243826746888572.94, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04853503406047821, "optim/lr": 1.2954466045074665e-05, "optim/total_tokens": 1974250504192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2742780447006226, "created_at": "2025-06-03T08:07:43.536534+00:00"} {"global_step": 235350, "acc_step": 0, "speed/wps": 5521.668667748119, "speed/FLOPS": 244029492652171.06, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 193.84, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04727422446012497, "optim/lr": 1.2950918819980117e-05, "optim/total_tokens": 1974258892800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2634456157684326, "created_at": "2025-06-03T08:07:46.510477+00:00"} {"global_step": 235351, "acc_step": 0, "speed/wps": 5527.68382311072, "speed/FLOPS": 244295331730841.88, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04731430858373642, "optim/lr": 1.294737159488557e-05, "optim/total_tokens": 1974267281408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.268135666847229, "created_at": "2025-06-03T08:07:49.479039+00:00"} {"global_step": 235352, "acc_step": 0, "speed/wps": 5524.651097784903, "speed/FLOPS": 244161300794336.12, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04643050208687782, "optim/lr": 1.2943824369791024e-05, "optim/total_tokens": 1974275670016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2590134143829346, "created_at": "2025-06-03T08:07:52.449588+00:00"} {"global_step": 235353, "acc_step": 0, "speed/wps": 5515.51962200314, "speed/FLOPS": 243757736303912.28, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04604604095220566, "optim/lr": 1.29402771446967e-05, "optim/total_tokens": 1974284058624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2530207633972168, "created_at": "2025-06-03T08:07:55.424737+00:00"} {"global_step": 235354, "acc_step": 0, "speed/wps": 5530.75432739044, "speed/FLOPS": 244431032303739.88, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046533212065696716, "optim/lr": 1.2936729919602153e-05, "optim/total_tokens": 1974292447232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.275922417640686, "created_at": "2025-06-03T08:07:58.391889+00:00"} {"global_step": 235355, "acc_step": 0, "speed/wps": 5519.497250864465, "speed/FLOPS": 243933527140232.72, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.047597721219062805, "optim/lr": 1.2933182694507605e-05, "optim/total_tokens": 1974300835840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2621148824691772, "created_at": "2025-06-03T08:08:01.365037+00:00"} {"global_step": 235356, "acc_step": 0, "speed/wps": 5513.484603291113, "speed/FLOPS": 243667798893010.7, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.01 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.01, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04596330597996712, "optim/lr": 1.2929635469413059e-05, "optim/total_tokens": 1974309224448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2702361345291138, "created_at": "2025-06-03T08:08:04.341177+00:00"} {"global_step": 235357, "acc_step": 0, "speed/wps": 5534.239424105296, "speed/FLOPS": 244585055740194.44, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.4, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046002838760614395, "optim/lr": 1.2926088244318734e-05, "optim/total_tokens": 1974317613056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2500786781311035, "created_at": "2025-06-03T08:08:07.305970+00:00"} {"global_step": 235358, "acc_step": 0, "speed/wps": 5522.757916306489, "speed/FLOPS": 244077631863171.5, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04676229506731033, "optim/lr": 1.2922541019224188e-05, "optim/total_tokens": 1974326001664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2625499963760376, "created_at": "2025-06-03T08:08:10.277114+00:00"} {"global_step": 235359, "acc_step": 0, "speed/wps": 5533.2254976162785, "speed/FLOPS": 244540245379126.1, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0463503934442997, "optim/lr": 1.2918993794129641e-05, "optim/total_tokens": 1974334390272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2864187955856323, "created_at": "2025-06-03T08:08:13.247242+00:00"} {"global_step": 235360, "acc_step": 0, "speed/wps": 5526.448236379568, "speed/FLOPS": 244240725121631.12, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04504626244306564, "optim/lr": 1.2915446569035317e-05, "optim/total_tokens": 1974342778880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2558882236480713, "created_at": "2025-06-03T08:08:16.216695+00:00"} {"global_step": 235361, "acc_step": 0, "speed/wps": 5528.786950320539, "speed/FLOPS": 244344084307198.94, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0472162701189518, "optim/lr": 1.2911899343940769e-05, "optim/total_tokens": 1974351167488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2590985298156738, "created_at": "2025-06-03T08:08:19.186963+00:00"} {"global_step": 235362, "acc_step": 0, "speed/wps": 5544.000617971163, "speed/FLOPS": 245016450546746.3, "speed/curr_iter_time": 2.9544, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9544, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.15, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04597800225019455, "optim/lr": 1.2908352118846222e-05, "optim/total_tokens": 1974359556096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2561569213867188, "created_at": "2025-06-03T08:08:22.147563+00:00"} {"global_step": 235363, "acc_step": 0, "speed/wps": 5515.66723399205, "speed/FLOPS": 243764259998275.44, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04757098853588104, "optim/lr": 1.2904804893751676e-05, "optim/total_tokens": 1974367944704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2671658992767334, "created_at": "2025-06-03T08:08:25.128513+00:00"} {"global_step": 235364, "acc_step": 0, "speed/wps": 5520.270144069175, "speed/FLOPS": 243967685063854.84, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04621009901165962, "optim/lr": 1.2901257668657352e-05, "optim/total_tokens": 1974376333312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2819161415100098, "created_at": "2025-06-03T08:08:28.104098+00:00"} {"global_step": 235365, "acc_step": 0, "speed/wps": 5515.585030083715, "speed/FLOPS": 243760627006284.75, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "3.0 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 3.0, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04627426713705063, "optim/lr": 1.2897710443562805e-05, "optim/total_tokens": 1974384721920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2664610147476196, "created_at": "2025-06-03T08:08:31.084744+00:00"} {"global_step": 235366, "acc_step": 0, "speed/wps": 5539.044171596372, "speed/FLOPS": 244797400986372.9, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04780353605747223, "optim/lr": 1.2894163218468257e-05, "optim/total_tokens": 1974393110528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.255374550819397, "created_at": "2025-06-03T08:08:34.052171+00:00"} {"global_step": 235367, "acc_step": 0, "speed/wps": 5520.996348332548, "speed/FLOPS": 243999779575245.56, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04943496733903885, "optim/lr": 1.289061599337371e-05, "optim/total_tokens": 1974401499136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2632629871368408, "created_at": "2025-06-03T08:08:37.024508+00:00"} {"global_step": 235368, "acc_step": 0, "speed/wps": 5534.558785654712, "speed/FLOPS": 244599169886038.0, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.49, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05102894455194473, "optim/lr": 1.2887068768279386e-05, "optim/total_tokens": 1974409887744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2684009075164795, "created_at": "2025-06-03T08:08:39.992982+00:00"} {"global_step": 235369, "acc_step": 0, "speed/wps": 5533.110659436397, "speed/FLOPS": 244535170119370.4, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04754814878106117, "optim/lr": 1.288352154318484e-05, "optim/total_tokens": 1974418276352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2746586799621582, "created_at": "2025-06-03T08:08:42.958580+00:00"} {"global_step": 235370, "acc_step": 0, "speed/wps": 5526.270189524552, "speed/FLOPS": 244232856361965.84, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04887819290161133, "optim/lr": 1.2879974318090293e-05, "optim/total_tokens": 1974426664960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2585515975952148, "created_at": "2025-06-03T08:08:45.930907+00:00"} {"global_step": 235371, "acc_step": 0, "speed/wps": 5523.184330356279, "speed/FLOPS": 244096477181587.25, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049317728728055954, "optim/lr": 1.2876427092995745e-05, "optim/total_tokens": 1974435053568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2615927457809448, "created_at": "2025-06-03T08:08:48.901963+00:00"} {"global_step": 235372, "acc_step": 0, "speed/wps": 5532.652601953861, "speed/FLOPS": 244514926323193.06, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0465797483921051, "optim/lr": 1.2872879867901421e-05, "optim/total_tokens": 1974443442176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2640193700790405, "created_at": "2025-06-03T08:08:51.867995+00:00"} {"global_step": 235373, "acc_step": 0, "speed/wps": 5519.375122276126, "speed/FLOPS": 243928129681738.88, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.99 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.99, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.053344108164310455, "optim/lr": 1.2869332642806874e-05, "optim/total_tokens": 1974451830784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2613862752914429, "created_at": "2025-06-03T08:08:54.845678+00:00"} {"global_step": 235374, "acc_step": 0, "speed/wps": 5525.541175474736, "speed/FLOPS": 244200637672396.12, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04741336405277252, "optim/lr": 1.2865785417712328e-05, "optim/total_tokens": 1974460219392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2687156200408936, "created_at": "2025-06-03T08:08:57.815018+00:00"} {"global_step": 235375, "acc_step": 0, "speed/wps": 5533.143838926401, "speed/FLOPS": 244536636483000.56, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046019297093153, "optim/lr": 1.2862238192617782e-05, "optim/total_tokens": 1974468608000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.271822214126587, "created_at": "2025-06-03T08:09:00.780966+00:00"} {"global_step": 235376, "acc_step": 0, "speed/wps": 5530.408804769831, "speed/FLOPS": 244415761972454.0, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048274923115968704, "optim/lr": 1.2858690967523457e-05, "optim/total_tokens": 1974476996608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.268710970878601, "created_at": "2025-06-03T08:09:03.750758+00:00"} {"global_step": 235377, "acc_step": 0, "speed/wps": 5523.603334965555, "speed/FLOPS": 244114995040657.25, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04629695788025856, "optim/lr": 1.2855143742428909e-05, "optim/total_tokens": 1974485385216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2661060094833374, "created_at": "2025-06-03T08:09:06.722570+00:00"} {"global_step": 235378, "acc_step": 0, "speed/wps": 5529.115683706501, "speed/FLOPS": 244358612640248.47, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046670131385326385, "optim/lr": 1.2851596517334363e-05, "optim/total_tokens": 1974493773824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2718312740325928, "created_at": "2025-06-03T08:09:09.690190+00:00"} {"global_step": 235379, "acc_step": 0, "speed/wps": 5531.181122007702, "speed/FLOPS": 244449894441289.94, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046805623918771744, "optim/lr": 1.2848049292239816e-05, "optim/total_tokens": 1974502162432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2628916501998901, "created_at": "2025-06-03T08:09:12.661386+00:00"} {"global_step": 235380, "acc_step": 0, "speed/wps": 5517.684334335304, "speed/FLOPS": 243853405508991.78, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047554682940244675, "optim/lr": 1.2844502067145492e-05, "optim/total_tokens": 1974510551040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2693167924880981, "created_at": "2025-06-03T08:09:15.635936+00:00"} {"global_step": 235381, "acc_step": 0, "speed/wps": 5530.339230718895, "speed/FLOPS": 244412687155514.94, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04701835662126541, "optim/lr": 1.2840954842050945e-05, "optim/total_tokens": 1974518939648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2675379514694214, "created_at": "2025-06-03T08:09:18.602725+00:00"} {"global_step": 235382, "acc_step": 0, "speed/wps": 5531.231707539358, "speed/FLOPS": 244452130062868.9, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04696883261203766, "optim/lr": 1.2837407616956397e-05, "optim/total_tokens": 1974527328256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2746919393539429, "created_at": "2025-06-03T08:09:21.574414+00:00"} {"global_step": 235383, "acc_step": 0, "speed/wps": 5535.4363492347975, "speed/FLOPS": 244637953704500.2, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046597279608249664, "optim/lr": 1.2833860391861851e-05, "optim/total_tokens": 1974535716864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.284414529800415, "created_at": "2025-06-03T08:09:24.542456+00:00"} {"global_step": 235384, "acc_step": 0, "speed/wps": 5531.171211960451, "speed/FLOPS": 244449456467925.66, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.52, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04554818570613861, "optim/lr": 1.2830313166767527e-05, "optim/total_tokens": 1974544105472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2678899765014648, "created_at": "2025-06-03T08:09:27.509339+00:00"} {"global_step": 235385, "acc_step": 0, "speed/wps": 5528.741071288692, "speed/FLOPS": 244342056688821.47, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047061458230018616, "optim/lr": 1.282676594167298e-05, "optim/total_tokens": 1974552494080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.261316180229187, "created_at": "2025-06-03T08:09:30.482371+00:00"} {"global_step": 235386, "acc_step": 0, "speed/wps": 5520.836212527004, "speed/FLOPS": 243992702392289.88, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04980916529893875, "optim/lr": 1.2823218716578434e-05, "optim/total_tokens": 1974560882688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.270499348640442, "created_at": "2025-06-03T08:09:33.457382+00:00"} {"global_step": 235387, "acc_step": 0, "speed/wps": 5525.760506720198, "speed/FLOPS": 244210330990806.47, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0497748926281929, "optim/lr": 1.2819671491484108e-05, "optim/total_tokens": 1974569271296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 425, "loss/out": 1.2851771116256714, "created_at": "2025-06-03T08:09:36.428130+00:00"} {"global_step": 235388, "acc_step": 0, "speed/wps": 5516.277711762869, "speed/FLOPS": 243791239991037.16, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.050678931176662445, "optim/lr": 1.2816124266389561e-05, "optim/total_tokens": 1974577659904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.285174012184143, "created_at": "2025-06-03T08:09:39.403370+00:00"} {"global_step": 235389, "acc_step": 0, "speed/wps": 5523.214496758638, "speed/FLOPS": 244097810382165.88, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04611517861485481, "optim/lr": 1.2812577041295015e-05, "optim/total_tokens": 1974586048512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2701770067214966, "created_at": "2025-06-03T08:09:42.374282+00:00"} {"global_step": 235390, "acc_step": 0, "speed/wps": 5519.438116078018, "speed/FLOPS": 243930913685351.0, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.98 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.98, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04989289492368698, "optim/lr": 1.2809029816200468e-05, "optim/total_tokens": 1974594437120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2540498971939087, "created_at": "2025-06-03T08:09:45.347415+00:00"} {"global_step": 235391, "acc_step": 0, "speed/wps": 5527.469783810445, "speed/FLOPS": 244285872289322.12, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04998651146888733, "optim/lr": 1.2805482591106144e-05, "optim/total_tokens": 1974602825728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.265091061592102, "created_at": "2025-06-03T08:09:48.319429+00:00"} {"global_step": 235392, "acc_step": 0, "speed/wps": 5517.771041658687, "speed/FLOPS": 243857237528877.0, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049015965312719345, "optim/lr": 1.2801935366011598e-05, "optim/total_tokens": 1974611214336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.278818964958191, "created_at": "2025-06-03T08:09:51.293326+00:00"} {"global_step": 235393, "acc_step": 0, "speed/wps": 5542.744251979358, "speed/FLOPS": 244960925600572.66, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.22, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04835302382707596, "optim/lr": 1.279838814091705e-05, "optim/total_tokens": 1974619602944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.257790446281433, "created_at": "2025-06-03T08:09:54.253665+00:00"} {"global_step": 235394, "acc_step": 0, "speed/wps": 5523.1645792707695, "speed/FLOPS": 244095604284702.94, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04621822014451027, "optim/lr": 1.2794840915822503e-05, "optim/total_tokens": 1974627991552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2738893032073975, "created_at": "2025-06-03T08:09:57.224692+00:00"} {"global_step": 235395, "acc_step": 0, "speed/wps": 5523.068186758099, "speed/FLOPS": 244091344229024.5, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05040843039751053, "optim/lr": 1.2791293690728179e-05, "optim/total_tokens": 1974636380160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2603336572647095, "created_at": "2025-06-03T08:10:00.196627+00:00"} {"global_step": 235396, "acc_step": 0, "speed/wps": 5534.059498720715, "speed/FLOPS": 244577103959137.53, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.53, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046285469084978104, "optim/lr": 1.2787746465633632e-05, "optim/total_tokens": 1974644768768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2695033550262451, "created_at": "2025-06-03T08:10:03.162123+00:00"} {"global_step": 235397, "acc_step": 0, "speed/wps": 5511.8271967431865, "speed/FLOPS": 243594550006968.1, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04682504013180733, "optim/lr": 1.2784199240539086e-05, "optim/total_tokens": 1974653157376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2652641534805298, "created_at": "2025-06-03T08:10:06.139944+00:00"} {"global_step": 235398, "acc_step": 0, "speed/wps": 5524.477904152521, "speed/FLOPS": 244153646522270.22, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04718239977955818, "optim/lr": 1.2780652015444538e-05, "optim/total_tokens": 1974661545984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2766457796096802, "created_at": "2025-06-03T08:10:09.114537+00:00"} {"global_step": 235399, "acc_step": 0, "speed/wps": 5525.889474805786, "speed/FLOPS": 244216030720071.0, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04540079087018967, "optim/lr": 1.2777104790350213e-05, "optim/total_tokens": 1974669934592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2668888568878174, "created_at": "2025-06-03T08:10:12.084223+00:00"} {"global_step": 235400, "acc_step": 0, "speed/wps": 5538.862349767225, "speed/FLOPS": 244789365392173.12, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.36, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04724832624197006, "optim/lr": 1.2773557565255667e-05, "optim/total_tokens": 1974678323200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2661679983139038, "created_at": "2025-06-03T08:10:15.046921+00:00"} {"global_step": 235401, "acc_step": 0, "speed/wps": 5535.221162719604, "speed/FLOPS": 244628443561953.06, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.39, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047579266130924225, "optim/lr": 1.277001034016112e-05, "optim/total_tokens": 1974686711808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2692679166793823, "created_at": "2025-06-03T08:10:18.014879+00:00"} {"global_step": 235402, "acc_step": 0, "speed/wps": 5533.5580917848865, "speed/FLOPS": 244554944339007.28, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.55, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04692161828279495, "optim/lr": 1.2766463115066574e-05, "optim/total_tokens": 1974695100416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.269246220588684, "created_at": "2025-06-03T08:10:20.980299+00:00"} {"global_step": 235403, "acc_step": 0, "speed/wps": 5506.285169835303, "speed/FLOPS": 243349620784304.88, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048121266067028046, "optim/lr": 1.2762915889972248e-05, "optim/total_tokens": 1974703489024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2609045505523682, "created_at": "2025-06-03T08:10:23.960251+00:00"} {"global_step": 235404, "acc_step": 0, "speed/wps": 5521.260275159023, "speed/FLOPS": 244011443790075.78, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0461839959025383, "optim/lr": 1.2759368664877701e-05, "optim/total_tokens": 1974711877632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2704545259475708, "created_at": "2025-06-03T08:10:26.932331+00:00"} {"global_step": 235405, "acc_step": 0, "speed/wps": 5523.596526531096, "speed/FLOPS": 244114694142702.88, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04604001343250275, "optim/lr": 1.2755821439783155e-05, "optim/total_tokens": 1974720266240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2561863660812378, "created_at": "2025-06-03T08:10:29.903947+00:00"} {"global_step": 235406, "acc_step": 0, "speed/wps": 5513.033015384741, "speed/FLOPS": 243647841018985.5, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.97 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.97, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04879586771130562, "optim/lr": 1.2752274214688609e-05, "optim/total_tokens": 1974728654848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2642217874526978, "created_at": "2025-06-03T08:10:32.883915+00:00"} {"global_step": 235407, "acc_step": 0, "speed/wps": 5514.185032576211, "speed/FLOPS": 243698754282289.94, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04730841889977455, "optim/lr": 1.2748726989594284e-05, "optim/total_tokens": 1974737043456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2860937118530273, "created_at": "2025-06-03T08:10:35.859736+00:00"} {"global_step": 235408, "acc_step": 0, "speed/wps": 5513.491163913498, "speed/FLOPS": 243668088838939.8, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05269894003868103, "optim/lr": 1.2745179764499736e-05, "optim/total_tokens": 1974745432064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2629989385604858, "created_at": "2025-06-03T08:10:38.839271+00:00"} {"global_step": 235409, "acc_step": 0, "speed/wps": 5539.055884851955, "speed/FLOPS": 244797918652315.8, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.37, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049120642244815826, "optim/lr": 1.274163253940519e-05, "optim/total_tokens": 1974753820672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2669222354888916, "created_at": "2025-06-03T08:10:41.801933+00:00"} {"global_step": 235410, "acc_step": 0, "speed/wps": 5537.102024360592, "speed/FLOPS": 244711568019362.12, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.44, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05184706673026085, "optim/lr": 1.2738085314310643e-05, "optim/total_tokens": 1974762209280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2854599952697754, "created_at": "2025-06-03T08:10:44.769130+00:00"} {"global_step": 235411, "acc_step": 0, "speed/wps": 5528.730774696055, "speed/FLOPS": 244341601632129.66, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04950730502605438, "optim/lr": 1.2734538089216319e-05, "optim/total_tokens": 1974770597888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2550349235534668, "created_at": "2025-06-03T08:10:47.737231+00:00"} {"global_step": 235412, "acc_step": 0, "speed/wps": 5528.61727059599, "speed/FLOPS": 244336585331873.44, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04924152046442032, "optim/lr": 1.2730990864121772e-05, "optim/total_tokens": 1974778986496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2673835754394531, "created_at": "2025-06-03T08:10:50.705387+00:00"} {"global_step": 235413, "acc_step": 0, "speed/wps": 5512.124776090002, "speed/FLOPS": 243607701490948.2, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04684657230973244, "optim/lr": 1.2727443639027226e-05, "optim/total_tokens": 1974787375104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2745634317398071, "created_at": "2025-06-03T08:10:53.683935+00:00"} {"global_step": 235414, "acc_step": 0, "speed/wps": 5511.134803969512, "speed/FLOPS": 243563949790359.2, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.96 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.96, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04708709940314293, "optim/lr": 1.27238964139329e-05, "optim/total_tokens": 1974795763712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2523486614227295, "created_at": "2025-06-03T08:10:56.661686+00:00"} {"global_step": 235415, "acc_step": 0, "speed/wps": 5523.574085654529, "speed/FLOPS": 244113702370821.44, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048069681972265244, "optim/lr": 1.2720349188838354e-05, "optim/total_tokens": 1974804152320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.270644187927246, "created_at": "2025-06-03T08:10:59.632282+00:00"} {"global_step": 235416, "acc_step": 0, "speed/wps": 5526.272727960734, "speed/FLOPS": 244232968547852.22, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04553075507283211, "optim/lr": 1.2716801963743807e-05, "optim/total_tokens": 1974812540928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2579188346862793, "created_at": "2025-06-03T08:11:02.605848+00:00"} {"global_step": 235417, "acc_step": 0, "speed/wps": 5526.223632701054, "speed/FLOPS": 244230798788666.66, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048687566071748734, "optim/lr": 1.271325473864926e-05, "optim/total_tokens": 1974820929536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2677581310272217, "created_at": "2025-06-03T08:11:05.578919+00:00"} {"global_step": 235418, "acc_step": 0, "speed/wps": 5525.172935080056, "speed/FLOPS": 244184363331776.5, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.76, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04650342836976051, "optim/lr": 1.2709707513554936e-05, "optim/total_tokens": 1974829318144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.273346185684204, "created_at": "2025-06-03T08:11:08.548664+00:00"} {"global_step": 235419, "acc_step": 0, "speed/wps": 5531.526830280239, "speed/FLOPS": 244465172977440.72, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04652658849954605, "optim/lr": 1.2706160288460388e-05, "optim/total_tokens": 1974837706752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.267964243888855, "created_at": "2025-06-03T08:11:11.514872+00:00"} {"global_step": 235420, "acc_step": 0, "speed/wps": 5522.061032758089, "speed/FLOPS": 244046833177305.56, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04990233853459358, "optim/lr": 1.2702613063365842e-05, "optim/total_tokens": 1974846095360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.268949031829834, "created_at": "2025-06-03T08:11:14.486758+00:00"} {"global_step": 235421, "acc_step": 0, "speed/wps": 5514.623908580831, "speed/FLOPS": 243718150355323.12, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04600268974900246, "optim/lr": 1.2699065838271295e-05, "optim/total_tokens": 1974854483968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2672449350357056, "created_at": "2025-06-03T08:11:17.462553+00:00"} {"global_step": 235422, "acc_step": 0, "speed/wps": 5515.369042068915, "speed/FLOPS": 243751081441557.53, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0476347953081131, "optim/lr": 1.2695518613176971e-05, "optim/total_tokens": 1974862872576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2535525560379028, "created_at": "2025-06-03T08:11:20.439027+00:00"} {"global_step": 235423, "acc_step": 0, "speed/wps": 5517.997766099775, "speed/FLOPS": 243867257588692.2, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05058978870511055, "optim/lr": 1.2691971388082425e-05, "optim/total_tokens": 1974871261184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.274165153503418, "created_at": "2025-06-03T08:11:23.412884+00:00"} {"global_step": 235424, "acc_step": 0, "speed/wps": 5512.835232505525, "speed/FLOPS": 243639100028068.7, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046257197856903076, "optim/lr": 1.2688424162987876e-05, "optim/total_tokens": 1974879649792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2624067068099976, "created_at": "2025-06-03T08:11:26.389371+00:00"} {"global_step": 235425, "acc_step": 0, "speed/wps": 5513.171394181655, "speed/FLOPS": 243653956653522.22, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05298468470573425, "optim/lr": 1.268487693789333e-05, "optim/total_tokens": 1974888038400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2676901817321777, "created_at": "2025-06-03T08:11:29.366208+00:00"} {"global_step": 235426, "acc_step": 0, "speed/wps": 5537.176449060733, "speed/FLOPS": 244714857210168.22, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 193.45, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04821458086371422, "optim/lr": 1.2681329712799006e-05, "optim/total_tokens": 1974896427008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.258618950843811, "created_at": "2025-06-03T08:11:32.330346+00:00"} {"global_step": 235427, "acc_step": 0, "speed/wps": 5536.322502347626, "speed/FLOPS": 244677117136344.4, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 193.48, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04829651489853859, "optim/lr": 1.267778248770446e-05, "optim/total_tokens": 1974904815616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2682567834854126, "created_at": "2025-06-03T08:11:35.294131+00:00"} {"global_step": 235428, "acc_step": 0, "speed/wps": 5519.266578120851, "speed/FLOPS": 243923332585655.1, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05491150543093681, "optim/lr": 1.2674235262609913e-05, "optim/total_tokens": 1974913204224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2702995538711548, "created_at": "2025-06-03T08:11:38.267682+00:00"} {"global_step": 235429, "acc_step": 0, "speed/wps": 5513.296079438197, "speed/FLOPS": 243659467103664.38, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.95 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.95, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04611209034919739, "optim/lr": 1.2670688037515365e-05, "optim/total_tokens": 1974921592832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2722853422164917, "created_at": "2025-06-03T08:11:41.244022+00:00"} {"global_step": 235430, "acc_step": 0, "speed/wps": 5531.618253720438, "speed/FLOPS": 244469213425549.94, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.059521403163671494, "optim/lr": 1.266714081242104e-05, "optim/total_tokens": 1974929981440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.263129711151123, "created_at": "2025-06-03T08:11:44.214256+00:00"} {"global_step": 235431, "acc_step": 0, "speed/wps": 5527.503784901183, "speed/FLOPS": 244287374963499.4, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04675416648387909, "optim/lr": 1.2663593587326494e-05, "optim/total_tokens": 1974938370048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2612431049346924, "created_at": "2025-06-03T08:11:47.183130+00:00"} {"global_step": 235432, "acc_step": 0, "speed/wps": 5517.806501035223, "speed/FLOPS": 243858804651822.34, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04853733256459236, "optim/lr": 1.2660046362231947e-05, "optim/total_tokens": 1974946758656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2746113538742065, "created_at": "2025-06-03T08:11:50.161078+00:00"} {"global_step": 235433, "acc_step": 0, "speed/wps": 5516.94340782508, "speed/FLOPS": 243820660349645.53, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04990195482969284, "optim/lr": 1.2656499137137401e-05, "optim/total_tokens": 1974955147264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2736411094665527, "created_at": "2025-06-03T08:11:53.135977+00:00"} {"global_step": 235434, "acc_step": 0, "speed/wps": 5531.581327769528, "speed/FLOPS": 244467581487523.88, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046908218413591385, "optim/lr": 1.2652951912043077e-05, "optim/total_tokens": 1974963535872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2702312469482422, "created_at": "2025-06-03T08:11:56.102586+00:00"} {"global_step": 235435, "acc_step": 0, "speed/wps": 5525.515986240275, "speed/FLOPS": 244199524437163.16, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.76, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.051600512117147446, "optim/lr": 1.2649404686948528e-05, "optim/total_tokens": 1974971924480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2695456743240356, "created_at": "2025-06-03T08:11:59.072501+00:00"} {"global_step": 235436, "acc_step": 0, "speed/wps": 5523.574012814545, "speed/FLOPS": 244113699151666.97, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04642303287982941, "optim/lr": 1.2645857461853982e-05, "optim/total_tokens": 1974980313088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.274971842765808, "created_at": "2025-06-03T08:12:02.043389+00:00"} {"global_step": 235437, "acc_step": 0, "speed/wps": 5524.45583170644, "speed/FLOPS": 244152671033130.47, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04680798575282097, "optim/lr": 1.2642310236759436e-05, "optim/total_tokens": 1974988701696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2683719396591187, "created_at": "2025-06-03T08:12:05.014537+00:00"} {"global_step": 235438, "acc_step": 0, "speed/wps": 5525.47838157377, "speed/FLOPS": 244197862503381.78, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04666699469089508, "optim/lr": 1.2638763011665111e-05, "optim/total_tokens": 1974997090304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.265596866607666, "created_at": "2025-06-03T08:12:07.983850+00:00"} {"global_step": 235439, "acc_step": 0, "speed/wps": 5523.366831156055, "speed/FLOPS": 244104542782813.56, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04713311418890953, "optim/lr": 1.2635215786570565e-05, "optim/total_tokens": 1975005478912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2697147130966187, "created_at": "2025-06-03T08:12:10.960686+00:00"} {"global_step": 235440, "acc_step": 0, "speed/wps": 5513.4268050856235, "speed/FLOPS": 243665244508166.1, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04660193249583244, "optim/lr": 1.2631668561476017e-05, "optim/total_tokens": 1975013867520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2777631282806396, "created_at": "2025-06-03T08:12:13.936808+00:00"} {"global_step": 235441, "acc_step": 0, "speed/wps": 5514.377581576155, "speed/FLOPS": 243707263962532.34, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04657445847988129, "optim/lr": 1.2628121336381692e-05, "optim/total_tokens": 1975022256128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.261893391609192, "created_at": "2025-06-03T08:12:16.912294+00:00"} {"global_step": 235442, "acc_step": 0, "speed/wps": 5529.01633518045, "speed/FLOPS": 244354221943908.88, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04614154249429703, "optim/lr": 1.2624574111287146e-05, "optim/total_tokens": 1975030644736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2777888774871826, "created_at": "2025-06-03T08:12:19.880193+00:00"} {"global_step": 235443, "acc_step": 0, "speed/wps": 5523.022240464482, "speed/FLOPS": 244089313638021.1, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04582544043660164, "optim/lr": 1.26210268861926e-05, "optim/total_tokens": 1975039033344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.260259985923767, "created_at": "2025-06-03T08:12:22.851357+00:00"} {"global_step": 235444, "acc_step": 0, "speed/wps": 5514.505578501224, "speed/FLOPS": 243712920771472.72, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047352857887744904, "optim/lr": 1.2617479661098053e-05, "optim/total_tokens": 1975047421952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2568408250808716, "created_at": "2025-06-03T08:12:25.826851+00:00"} {"global_step": 235445, "acc_step": 0, "speed/wps": 5507.85331416198, "speed/FLOPS": 243418924737053.7, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.94 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.94, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04824385419487953, "optim/lr": 1.2613932436003727e-05, "optim/total_tokens": 1975055810560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2681593894958496, "created_at": "2025-06-03T08:12:28.806345+00:00"} {"global_step": 235446, "acc_step": 0, "speed/wps": 5522.361830493136, "speed/FLOPS": 244060126897572.25, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046325623989105225, "optim/lr": 1.261038521090918e-05, "optim/total_tokens": 1975064199168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2605334520339966, "created_at": "2025-06-03T08:12:31.781100+00:00"} {"global_step": 235447, "acc_step": 0, "speed/wps": 5516.095554595582, "speed/FLOPS": 243783189576607.97, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04668954759836197, "optim/lr": 1.2606837985814634e-05, "optim/total_tokens": 1975072587776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.25941801071167, "created_at": "2025-06-03T08:12:34.756619+00:00"} {"global_step": 235448, "acc_step": 0, "speed/wps": 5522.34854566241, "speed/FLOPS": 244059539776052.1, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04782142862677574, "optim/lr": 1.2603290760720088e-05, "optim/total_tokens": 1975080976384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2526658773422241, "created_at": "2025-06-03T08:12:37.728254+00:00"} {"global_step": 235449, "acc_step": 0, "speed/wps": 5512.309844426026, "speed/FLOPS": 243615880564134.8, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 194.34, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04592740535736084, "optim/lr": 1.2599743535625763e-05, "optim/total_tokens": 1975089364992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2885621786117554, "created_at": "2025-06-03T08:12:40.707671+00:00"} {"global_step": 235450, "acc_step": 0, "speed/wps": 5507.7881927923445, "speed/FLOPS": 243416046705837.2, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04835706949234009, "optim/lr": 1.2596196310531217e-05, "optim/total_tokens": 1975097753600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.256976842880249, "created_at": "2025-06-03T08:12:43.687075+00:00"} {"global_step": 235451, "acc_step": 0, "speed/wps": 5507.268672031986, "speed/FLOPS": 243393086547377.66, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.93 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.93, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04841938614845276, "optim/lr": 1.2592649085436669e-05, "optim/total_tokens": 1975106142208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2908164262771606, "created_at": "2025-06-03T08:12:46.670691+00:00"} {"global_step": 235452, "acc_step": 0, "speed/wps": 5521.785507718084, "speed/FLOPS": 244034656380802.34, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05227360501885414, "optim/lr": 1.2589101860342122e-05, "optim/total_tokens": 1975114530816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2611620426177979, "created_at": "2025-06-03T08:12:49.646884+00:00"} {"global_step": 235453, "acc_step": 0, "speed/wps": 5533.1053977075635, "speed/FLOPS": 244534937577887.94, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0461668036878109, "optim/lr": 1.2585554635247798e-05, "optim/total_tokens": 1975122919424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2677507400512695, "created_at": "2025-06-03T08:12:52.615047+00:00"} {"global_step": 235454, "acc_step": 0, "speed/wps": 5535.288810607739, "speed/FLOPS": 244631433252355.38, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04604100063443184, "optim/lr": 1.2582007410153252e-05, "optim/total_tokens": 1975131308032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2637168169021606, "created_at": "2025-06-03T08:12:55.579695+00:00"} {"global_step": 235455, "acc_step": 0, "speed/wps": 5530.174648830993, "speed/FLOPS": 244405413478476.12, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.050293926149606705, "optim/lr": 1.2578460185058705e-05, "optim/total_tokens": 1975139696640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2627005577087402, "created_at": "2025-06-03T08:12:58.546835+00:00"} {"global_step": 235456, "acc_step": 0, "speed/wps": 5519.238471666281, "speed/FLOPS": 243922090424224.97, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04662338271737099, "optim/lr": 1.2574912959964157e-05, "optim/total_tokens": 1975148085248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2615848779678345, "created_at": "2025-06-03T08:13:01.520145+00:00"} {"global_step": 235457, "acc_step": 0, "speed/wps": 5516.046219712619, "speed/FLOPS": 243781009227299.8, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04655845835804939, "optim/lr": 1.2571365734869833e-05, "optim/total_tokens": 1975156473856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2448534965515137, "created_at": "2025-06-03T08:13:04.495519+00:00"} {"global_step": 235458, "acc_step": 0, "speed/wps": 5510.345192371439, "speed/FLOPS": 243529052999322.88, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.34, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045770082622766495, "optim/lr": 1.2567818509775286e-05, "optim/total_tokens": 1975164862464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2694666385650635, "created_at": "2025-06-03T08:13:07.473942+00:00"} {"global_step": 235459, "acc_step": 0, "speed/wps": 5527.745771339728, "speed/FLOPS": 244298069525484.22, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04819563776254654, "optim/lr": 1.256427128468074e-05, "optim/total_tokens": 1975173251072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2682608366012573, "created_at": "2025-06-03T08:13:10.442594+00:00"} {"global_step": 235460, "acc_step": 0, "speed/wps": 5522.293999391247, "speed/FLOPS": 244057129110059.8, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0462007112801075, "optim/lr": 1.2560724059586193e-05, "optim/total_tokens": 1975181639680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2590121030807495, "created_at": "2025-06-03T08:13:13.417041+00:00"} {"global_step": 235461, "acc_step": 0, "speed/wps": 5510.580798960425, "speed/FLOPS": 243539465604612.25, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047151725739240646, "optim/lr": 1.2557176834491867e-05, "optim/total_tokens": 1975190028288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2660688161849976, "created_at": "2025-06-03T08:13:16.396103+00:00"} {"global_step": 235462, "acc_step": 0, "speed/wps": 5524.822298271209, "speed/FLOPS": 244168866979547.3, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04601695016026497, "optim/lr": 1.255362960939732e-05, "optim/total_tokens": 1975198416896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2555803060531616, "created_at": "2025-06-03T08:13:19.368399+00:00"} {"global_step": 235463, "acc_step": 0, "speed/wps": 5509.844891102999, "speed/FLOPS": 243506942244031.88, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04649090766906738, "optim/lr": 1.2550082384302774e-05, "optim/total_tokens": 1975206805504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2518948316574097, "created_at": "2025-06-03T08:13:22.346512+00:00"} {"global_step": 235464, "acc_step": 0, "speed/wps": 5516.524777249966, "speed/FLOPS": 243802159020971.03, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04667491093277931, "optim/lr": 1.2546535159208228e-05, "optim/total_tokens": 1975215194112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.251907467842102, "created_at": "2025-06-03T08:13:25.321247+00:00"} {"global_step": 235465, "acc_step": 0, "speed/wps": 5513.538569161718, "speed/FLOPS": 243670183908269.1, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045442648231983185, "optim/lr": 1.2542987934113904e-05, "optim/total_tokens": 1975223582720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.25625741481781, "created_at": "2025-06-03T08:13:28.301570+00:00"} {"global_step": 235466, "acc_step": 0, "speed/wps": 5514.729332646179, "speed/FLOPS": 243722809559402.2, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.92 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.92, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04716126248240471, "optim/lr": 1.2539440709019355e-05, "optim/total_tokens": 1975231971328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.267777442932129, "created_at": "2025-06-03T08:13:31.277209+00:00"} {"global_step": 235467, "acc_step": 0, "speed/wps": 5520.494632618213, "speed/FLOPS": 243977606308685.75, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045589786022901535, "optim/lr": 1.2535893483924809e-05, "optim/total_tokens": 1975240359936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2661348581314087, "created_at": "2025-06-03T08:13:34.254082+00:00"} {"global_step": 235468, "acc_step": 0, "speed/wps": 5521.196326575776, "speed/FLOPS": 244008617590014.78, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04685782268643379, "optim/lr": 1.2532346258830263e-05, "optim/total_tokens": 1975248748544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2756410837173462, "created_at": "2025-06-03T08:13:37.226614+00:00"} {"global_step": 235469, "acc_step": 0, "speed/wps": 5526.508703343203, "speed/FLOPS": 244243397451925.8, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 193.86, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04607006162405014, "optim/lr": 1.2528799033735938e-05, "optim/total_tokens": 1975257137152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2603968381881714, "created_at": "2025-06-03T08:13:40.195785+00:00"} {"global_step": 235470, "acc_step": 0, "speed/wps": 5521.274847887182, "speed/FLOPS": 244012087830070.4, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04559572413563728, "optim/lr": 1.2525251808641392e-05, "optim/total_tokens": 1975265525760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2682424783706665, "created_at": "2025-06-03T08:13:43.171187+00:00"} {"global_step": 235471, "acc_step": 0, "speed/wps": 5521.010067190985, "speed/FLOPS": 244000385878568.97, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04573333263397217, "optim/lr": 1.2521704583546845e-05, "optim/total_tokens": 1975273914368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2598353624343872, "created_at": "2025-06-03T08:13:46.143290+00:00"} {"global_step": 235472, "acc_step": 0, "speed/wps": 5517.865905468345, "speed/FLOPS": 243861430023706.88, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04601126164197922, "optim/lr": 1.251815735845252e-05, "optim/total_tokens": 1975282302976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2875252962112427, "created_at": "2025-06-03T08:13:49.117196+00:00"} {"global_step": 235473, "acc_step": 0, "speed/wps": 5513.879231312437, "speed/FLOPS": 243685239431663.88, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04783519357442856, "optim/lr": 1.2514610133357973e-05, "optim/total_tokens": 1975290691584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.248448133468628, "created_at": "2025-06-03T08:13:52.096174+00:00"} {"global_step": 235474, "acc_step": 0, "speed/wps": 5513.503241944797, "speed/FLOPS": 243668622626102.25, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046373214572668076, "optim/lr": 1.2511062908263426e-05, "optim/total_tokens": 1975299080192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2547085285186768, "created_at": "2025-06-03T08:13:55.072974+00:00"} {"global_step": 235475, "acc_step": 0, "speed/wps": 5503.707919762852, "speed/FLOPS": 243235719522664.22, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048240918666124344, "optim/lr": 1.250751568316888e-05, "optim/total_tokens": 1975307468800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2632040977478027, "created_at": "2025-06-03T08:13:58.054574+00:00"} {"global_step": 235476, "acc_step": 0, "speed/wps": 5523.8029358230815, "speed/FLOPS": 244123816376910.1, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04693560674786568, "optim/lr": 1.2503968458074556e-05, "optim/total_tokens": 1975315857408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2668119668960571, "created_at": "2025-06-03T08:14:01.029532+00:00"} {"global_step": 235477, "acc_step": 0, "speed/wps": 5518.700119945735, "speed/FLOPS": 243898298033710.78, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046305038034915924, "optim/lr": 1.2500421232980008e-05, "optim/total_tokens": 1975324246016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2768969535827637, "created_at": "2025-06-03T08:14:04.002886+00:00"} {"global_step": 235478, "acc_step": 0, "speed/wps": 5521.388346161928, "speed/FLOPS": 244017103872877.38, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049916476011276245, "optim/lr": 1.2496874007885461e-05, "optim/total_tokens": 1975332634624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2685332298278809, "created_at": "2025-06-03T08:14:06.978774+00:00"} {"global_step": 235479, "acc_step": 0, "speed/wps": 5511.168185285249, "speed/FLOPS": 243565425073653.7, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04669344797730446, "optim/lr": 1.2493326782790915e-05, "optim/total_tokens": 1975341023232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.271654486656189, "created_at": "2025-06-03T08:14:09.959438+00:00"} {"global_step": 235480, "acc_step": 0, "speed/wps": 5523.509221108852, "speed/FLOPS": 244110835689909.34, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04732297733426094, "optim/lr": 1.248977955769659e-05, "optim/total_tokens": 1975349411840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.244828224182129, "created_at": "2025-06-03T08:14:12.930340+00:00"} {"global_step": 235481, "acc_step": 0, "speed/wps": 5522.556499554461, "speed/FLOPS": 244068730273676.25, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05513482168316841, "optim/lr": 1.2486232332602044e-05, "optim/total_tokens": 1975357800448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.270155906677246, "created_at": "2025-06-03T08:14:15.902137+00:00"} {"global_step": 235482, "acc_step": 0, "speed/wps": 5520.3133717392575, "speed/FLOPS": 243969595505613.22, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047725144773721695, "optim/lr": 1.2482685107507496e-05, "optim/total_tokens": 1975366189056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2649697065353394, "created_at": "2025-06-03T08:14:18.877060+00:00"} {"global_step": 235483, "acc_step": 0, "speed/wps": 5502.762605752865, "speed/FLOPS": 243193941481978.53, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.91 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.91, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05004969984292984, "optim/lr": 1.247913788241295e-05, "optim/total_tokens": 1975374577664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2556754350662231, "created_at": "2025-06-03T08:14:21.859291+00:00"} {"global_step": 235484, "acc_step": 0, "speed/wps": 5520.057852423535, "speed/FLOPS": 243958302859724.72, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045676346868276596, "optim/lr": 1.2475590657318625e-05, "optim/total_tokens": 1975382966272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2618322372436523, "created_at": "2025-06-03T08:14:24.832491+00:00"} {"global_step": 235485, "acc_step": 0, "speed/wps": 5526.869802200764, "speed/FLOPS": 244259356173158.5, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04765765741467476, "optim/lr": 1.2472043432224079e-05, "optim/total_tokens": 1975391354880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.262582540512085, "created_at": "2025-06-03T08:14:27.801321+00:00"} {"global_step": 235486, "acc_step": 0, "speed/wps": 5525.331106908921, "speed/FLOPS": 244191353717015.53, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0470888651907444, "optim/lr": 1.2468496207129532e-05, "optim/total_tokens": 1975399743488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2628031969070435, "created_at": "2025-06-03T08:14:30.774420+00:00"} {"global_step": 235487, "acc_step": 0, "speed/wps": 5527.125817980247, "speed/FLOPS": 244270670760204.12, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046495597809553146, "optim/lr": 1.2464948982034984e-05, "optim/total_tokens": 1975408132096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2835222482681274, "created_at": "2025-06-03T08:14:33.746368+00:00"} {"global_step": 235488, "acc_step": 0, "speed/wps": 5530.449299200729, "speed/FLOPS": 244417551619030.44, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04768815636634827, "optim/lr": 1.246140175694066e-05, "optim/total_tokens": 1975416520704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2916598320007324, "created_at": "2025-06-03T08:14:36.714970+00:00"} {"global_step": 235489, "acc_step": 0, "speed/wps": 5515.076641091781, "speed/FLOPS": 243738158815012.06, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0470871776342392, "optim/lr": 1.2457854531846113e-05, "optim/total_tokens": 1975424909312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2677468061447144, "created_at": "2025-06-03T08:14:39.692681+00:00"} {"global_step": 235490, "acc_step": 0, "speed/wps": 5517.672438293432, "speed/FLOPS": 243852879764830.47, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04659112170338631, "optim/lr": 1.2454307306751567e-05, "optim/total_tokens": 1975433297920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.28768789768219, "created_at": "2025-06-03T08:14:42.670006+00:00"} {"global_step": 235491, "acc_step": 0, "speed/wps": 5499.056940788704, "speed/FLOPS": 243030170057875.34, "speed/curr_iter_time": 2.9785, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9785, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04642907530069351, "optim/lr": 1.245076008165702e-05, "optim/total_tokens": 1975441686528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2728554010391235, "created_at": "2025-06-03T08:14:45.654091+00:00"} {"global_step": 235492, "acc_step": 0, "speed/wps": 5525.768246466695, "speed/FLOPS": 244210673047986.03, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046072229743003845, "optim/lr": 1.2447212856562696e-05, "optim/total_tokens": 1975450075136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2768285274505615, "created_at": "2025-06-03T08:14:48.623477+00:00"} {"global_step": 235493, "acc_step": 0, "speed/wps": 5518.081695758181, "speed/FLOPS": 243870966850002.8, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04792553558945656, "optim/lr": 1.2443665631468148e-05, "optim/total_tokens": 1975458463744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2600597143173218, "created_at": "2025-06-03T08:14:51.602967+00:00"} {"global_step": 235494, "acc_step": 0, "speed/wps": 5509.773245040207, "speed/FLOPS": 243503775854774.25, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.9 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.9, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04580477625131607, "optim/lr": 1.2440118406373601e-05, "optim/total_tokens": 1975466852352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2586088180541992, "created_at": "2025-06-03T08:14:54.584771+00:00"} {"global_step": 235495, "acc_step": 0, "speed/wps": 5521.613976765625, "speed/FLOPS": 244027075590678.66, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04718886688351631, "optim/lr": 1.2436571181279055e-05, "optim/total_tokens": 1975475240960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2558778524398804, "created_at": "2025-06-03T08:14:57.556526+00:00"} {"global_step": 235496, "acc_step": 0, "speed/wps": 5519.844101921769, "speed/FLOPS": 243948856181620.88, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046432506293058395, "optim/lr": 1.243302395618473e-05, "optim/total_tokens": 1975483629568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.268189787864685, "created_at": "2025-06-03T08:15:00.532900+00:00"} {"global_step": 235497, "acc_step": 0, "speed/wps": 5524.372457464916, "speed/FLOPS": 244148986318403.16, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05624133348464966, "optim/lr": 1.2429476731090184e-05, "optim/total_tokens": 1975492018176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.268518328666687, "created_at": "2025-06-03T08:15:03.503217+00:00"} {"global_step": 235498, "acc_step": 0, "speed/wps": 5519.382323783252, "speed/FLOPS": 243928447951493.22, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046150825917720795, "optim/lr": 1.2425929505995636e-05, "optim/total_tokens": 1975500406784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2616111040115356, "created_at": "2025-06-03T08:15:06.475987+00:00"} {"global_step": 235499, "acc_step": 0, "speed/wps": 5504.055433366642, "speed/FLOPS": 243251077845215.9, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.053181346505880356, "optim/lr": 1.2422382280901312e-05, "optim/total_tokens": 1975508795392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2641865015029907, "created_at": "2025-06-03T08:15:09.457277+00:00"} {"global_step": 235500, "acc_step": 0, "speed/wps": 5519.966691631934, "speed/FLOPS": 243954274019339.16, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04773147776722908, "optim/lr": 1.2418835055806765e-05, "optim/total_tokens": 1975517184000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2611035108566284, "created_at": "2025-06-03T08:15:12.430792+00:00"} {"global_step": 235501, "acc_step": 0, "speed/wps": 5529.247586843428, "speed/FLOPS": 244364442083759.16, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.050376858562231064, "optim/lr": 1.2415287830712219e-05, "optim/total_tokens": 1975525572608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2700188159942627, "created_at": "2025-06-03T08:15:15.398467+00:00"} {"global_step": 235502, "acc_step": 0, "speed/wps": 5515.524114981724, "speed/FLOPS": 243757934870568.53, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04935818538069725, "optim/lr": 1.2411740605617672e-05, "optim/total_tokens": 1975533961216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2754536867141724, "created_at": "2025-06-03T08:15:18.378192+00:00"} {"global_step": 235503, "acc_step": 0, "speed/wps": 5516.166431173437, "speed/FLOPS": 243786321958569.94, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04739081487059593, "optim/lr": 1.2408193380523348e-05, "optim/total_tokens": 1975542349824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2718181610107422, "created_at": "2025-06-03T08:15:21.353099+00:00"} {"global_step": 235504, "acc_step": 0, "speed/wps": 5525.014397071949, "speed/FLOPS": 244177356763289.25, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049908459186553955, "optim/lr": 1.24046461554288e-05, "optim/total_tokens": 1975550738432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2618769407272339, "created_at": "2025-06-03T08:15:24.327532+00:00"} {"global_step": 235505, "acc_step": 0, "speed/wps": 5523.859728118828, "speed/FLOPS": 244126326305692.75, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047055434435606, "optim/lr": 1.2401098930334253e-05, "optim/total_tokens": 1975559127040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2675882577896118, "created_at": "2025-06-03T08:15:27.298798+00:00"} {"global_step": 235506, "acc_step": 0, "speed/wps": 5524.869816588281, "speed/FLOPS": 244170967045941.12, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.051899634301662445, "optim/lr": 1.2397551705239707e-05, "optim/total_tokens": 1975567515648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2688339948654175, "created_at": "2025-06-03T08:15:30.269356+00:00"} {"global_step": 235507, "acc_step": 0, "speed/wps": 5513.652616216181, "speed/FLOPS": 243675224204330.6, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 194.33, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04735178500413895, "optim/lr": 1.2394004480145383e-05, "optim/total_tokens": 1975575904256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.261613368988037, "created_at": "2025-06-03T08:15:33.245897+00:00"} {"global_step": 235508, "acc_step": 0, "speed/wps": 5506.587711919154, "speed/FLOPS": 243362991595860.28, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.89 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.89, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047575339674949646, "optim/lr": 1.2390457255050836e-05, "optim/total_tokens": 1975584292864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.248053789138794, "created_at": "2025-06-03T08:15:36.225630+00:00"} {"global_step": 235509, "acc_step": 0, "speed/wps": 5523.942961999427, "speed/FLOPS": 244130004817185.62, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05098557844758034, "optim/lr": 1.2386910029956288e-05, "optim/total_tokens": 1975592681472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.26799476146698, "created_at": "2025-06-03T08:15:39.200803+00:00"} {"global_step": 235510, "acc_step": 0, "speed/wps": 5527.088814365609, "speed/FLOPS": 244269035389838.8, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 193.86, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04657889902591705, "optim/lr": 1.2383362804861742e-05, "optim/total_tokens": 1975601070080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.276755452156067, "created_at": "2025-06-03T08:15:42.169164+00:00"} {"global_step": 235511, "acc_step": 0, "speed/wps": 5514.239652542081, "speed/FLOPS": 243701168205211.06, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04758588969707489, "optim/lr": 1.2379815579767417e-05, "optim/total_tokens": 1975609458688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2674944400787354, "created_at": "2025-06-03T08:15:45.144600+00:00"} {"global_step": 235512, "acc_step": 0, "speed/wps": 5518.294801743964, "speed/FLOPS": 243880385043799.1, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04675554484128952, "optim/lr": 1.2376268354672871e-05, "optim/total_tokens": 1975617847296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2619284391403198, "created_at": "2025-06-03T08:15:48.121463+00:00"} {"global_step": 235513, "acc_step": 0, "speed/wps": 5526.696157776967, "speed/FLOPS": 244251681978419.44, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04674277454614639, "optim/lr": 1.2372721129578324e-05, "optim/total_tokens": 1975626235904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2778834104537964, "created_at": "2025-06-03T08:15:51.096022+00:00"} {"global_step": 235514, "acc_step": 0, "speed/wps": 5524.893684281083, "speed/FLOPS": 244172021875797.03, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045994438230991364, "optim/lr": 1.2369173904483776e-05, "optim/total_tokens": 1975634624512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.253970742225647, "created_at": "2025-06-03T08:15:54.070092+00:00"} {"global_step": 235515, "acc_step": 0, "speed/wps": 5505.461986132002, "speed/FLOPS": 243313240278055.1, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.88 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.88, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046541474759578705, "optim/lr": 1.2365626679389452e-05, "optim/total_tokens": 1975643013120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2835183143615723, "created_at": "2025-06-03T08:15:57.051013+00:00"} {"global_step": 235516, "acc_step": 0, "speed/wps": 5513.517100275452, "speed/FLOPS": 243669235093383.84, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04816228896379471, "optim/lr": 1.2362079454294906e-05, "optim/total_tokens": 1975651401728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2681975364685059, "created_at": "2025-06-03T08:16:00.027504+00:00"} {"global_step": 235517, "acc_step": 0, "speed/wps": 5514.536177834539, "speed/FLOPS": 243714273105383.66, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04567055404186249, "optim/lr": 1.2358532229200359e-05, "optim/total_tokens": 1975659790336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2665355205535889, "created_at": "2025-06-03T08:16:03.006076+00:00"} {"global_step": 235518, "acc_step": 0, "speed/wps": 5535.496960355288, "speed/FLOPS": 244640632405790.06, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04687993600964546, "optim/lr": 1.2354985004105813e-05, "optim/total_tokens": 1975668178944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.273931622505188, "created_at": "2025-06-03T08:16:05.970404+00:00"} {"global_step": 235519, "acc_step": 0, "speed/wps": 5521.146598043547, "speed/FLOPS": 244006419843423.97, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04577482491731644, "optim/lr": 1.2351437779011487e-05, "optim/total_tokens": 1975676567552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.269059419631958, "created_at": "2025-06-03T08:16:08.942822+00:00"} {"global_step": 235520, "acc_step": 0, "speed/wps": 5520.639173470293, "speed/FLOPS": 243983994274520.56, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04606706276535988, "optim/lr": 1.234789055391694e-05, "optim/total_tokens": 1975684956160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2895954847335815, "created_at": "2025-06-03T08:16:11.919911+00:00"} {"global_step": 235521, "acc_step": 0, "speed/wps": 5524.4081249105375, "speed/FLOPS": 244150562636937.1, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046021442860364914, "optim/lr": 1.2344343328822394e-05, "optim/total_tokens": 1975693344768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2616419792175293, "created_at": "2025-06-03T08:16:14.890078+00:00"} {"global_step": 235522, "acc_step": 0, "speed/wps": 5518.157725166722, "speed/FLOPS": 243874326960706.53, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04659226909279823, "optim/lr": 1.2340796103727847e-05, "optim/total_tokens": 1975701733376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2557412385940552, "created_at": "2025-06-03T08:16:17.866298+00:00"} {"global_step": 235523, "acc_step": 0, "speed/wps": 5512.782122133924, "speed/FLOPS": 243636752821487.44, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04654306545853615, "optim/lr": 1.2337248878633523e-05, "optim/total_tokens": 1975710121984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.2490160465240479, "created_at": "2025-06-03T08:16:20.842547+00:00"} {"global_step": 235524, "acc_step": 0, "speed/wps": 5513.093751078802, "speed/FLOPS": 243650525225789.5, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046402521431446075, "optim/lr": 1.2333701653538975e-05, "optim/total_tokens": 1975718510592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2659368515014648, "created_at": "2025-06-03T08:16:23.819395+00:00"} {"global_step": 235525, "acc_step": 0, "speed/wps": 5519.11532645909, "speed/FLOPS": 243916648036381.47, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046526141464710236, "optim/lr": 1.2330154428444428e-05, "optim/total_tokens": 1975726899200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2723592519760132, "created_at": "2025-06-03T08:16:26.796020+00:00"} {"global_step": 235526, "acc_step": 0, "speed/wps": 5526.634414938915, "speed/FLOPS": 244248953261006.03, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 193.9, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04946598783135414, "optim/lr": 1.2326607203350104e-05, "optim/total_tokens": 1975735287808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2626314163208008, "created_at": "2025-06-03T08:16:29.765226+00:00"} {"global_step": 235527, "acc_step": 0, "speed/wps": 5512.710095197392, "speed/FLOPS": 243633569599560.0, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.87 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.87, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.051775507628917694, "optim/lr": 1.2323059978255558e-05, "optim/total_tokens": 1975743676416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2538610696792603, "created_at": "2025-06-03T08:16:32.745168+00:00"} {"global_step": 235528, "acc_step": 0, "speed/wps": 5522.781013291901, "speed/FLOPS": 244078652631705.62, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046840768307447433, "optim/lr": 1.2319512753161011e-05, "optim/total_tokens": 1975752065024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2764381170272827, "created_at": "2025-06-03T08:16:35.719405+00:00"} {"global_step": 235529, "acc_step": 0, "speed/wps": 5521.002073070339, "speed/FLOPS": 244000032579354.06, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049123615026474, "optim/lr": 1.2315965528066465e-05, "optim/total_tokens": 1975760453632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2759205102920532, "created_at": "2025-06-03T08:16:38.691384+00:00"} {"global_step": 235530, "acc_step": 0, "speed/wps": 5520.535618208485, "speed/FLOPS": 243979417661992.53, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04650663211941719, "optim/lr": 1.2312418302972139e-05, "optim/total_tokens": 1975768842240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2610160112380981, "created_at": "2025-06-03T08:16:41.663781+00:00"} {"global_step": 235531, "acc_step": 0, "speed/wps": 5525.329435729946, "speed/FLOPS": 244191279859458.72, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04619390890002251, "optim/lr": 1.2308871077877592e-05, "optim/total_tokens": 1975777230848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2714046239852905, "created_at": "2025-06-03T08:16:44.633634+00:00"} {"global_step": 235532, "acc_step": 0, "speed/wps": 5514.954493237524, "speed/FLOPS": 243732760505063.28, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0489087775349617, "optim/lr": 1.2305323852783046e-05, "optim/total_tokens": 1975785619456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.276991844177246, "created_at": "2025-06-03T08:16:47.611764+00:00"} {"global_step": 235533, "acc_step": 0, "speed/wps": 5526.250384681266, "speed/FLOPS": 244231981089262.97, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04989895969629288, "optim/lr": 1.23017766276885e-05, "optim/total_tokens": 1975794008064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2607754468917847, "created_at": "2025-06-03T08:16:50.580959+00:00"} {"global_step": 235534, "acc_step": 0, "speed/wps": 5517.805739109864, "speed/FLOPS": 243858770978621.34, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05081574246287346, "optim/lr": 1.2298229402594175e-05, "optim/total_tokens": 1975802396672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2651885747909546, "created_at": "2025-06-03T08:16:53.557576+00:00"} {"global_step": 235535, "acc_step": 0, "speed/wps": 5522.211868254015, "speed/FLOPS": 244053499334179.44, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.052634745836257935, "optim/lr": 1.2294682177499627e-05, "optim/total_tokens": 1975810785280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2635715007781982, "created_at": "2025-06-03T08:16:56.529257+00:00"} {"global_step": 235536, "acc_step": 0, "speed/wps": 5523.840549341615, "speed/FLOPS": 244125478701905.84, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047313205897808075, "optim/lr": 1.229113495240508e-05, "optim/total_tokens": 1975819173888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2657183408737183, "created_at": "2025-06-03T08:16:59.499439+00:00"} {"global_step": 235537, "acc_step": 0, "speed/wps": 5520.06833411355, "speed/FLOPS": 243958766096773.22, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.053572431206703186, "optim/lr": 1.2287587727310534e-05, "optim/total_tokens": 1975827562496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2640599012374878, "created_at": "2025-06-03T08:17:02.473338+00:00"} {"global_step": 235538, "acc_step": 0, "speed/wps": 5522.313351181032, "speed/FLOPS": 244057984360116.88, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04638597369194031, "optim/lr": 1.228404050221621e-05, "optim/total_tokens": 1975835951104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2636373043060303, "created_at": "2025-06-03T08:17:05.444353+00:00"} {"global_step": 235539, "acc_step": 0, "speed/wps": 5514.644068399166, "speed/FLOPS": 243719041316106.22, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049780212342739105, "optim/lr": 1.2280493277121663e-05, "optim/total_tokens": 1975844339712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2605549097061157, "created_at": "2025-06-03T08:17:08.420062+00:00"} {"global_step": 235540, "acc_step": 0, "speed/wps": 5532.306599854834, "speed/FLOPS": 244499634801415.3, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 193.71, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.054580722004175186, "optim/lr": 1.2276946052027115e-05, "optim/total_tokens": 1975852728320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2481528520584106, "created_at": "2025-06-03T08:17:11.385657+00:00"} {"global_step": 235541, "acc_step": 0, "speed/wps": 5522.9458961926575, "speed/FLOPS": 244085939611971.84, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04719337821006775, "optim/lr": 1.2273398826932569e-05, "optim/total_tokens": 1975861116928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.255200982093811, "created_at": "2025-06-03T08:17:14.361020+00:00"} {"global_step": 235542, "acc_step": 0, "speed/wps": 5497.088655299333, "speed/FLOPS": 242943181913843.56, "speed/curr_iter_time": 2.9784, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9784, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.86 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.86, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.051100969314575195, "optim/lr": 1.2269851601838244e-05, "optim/total_tokens": 1975869505536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2672621011734009, "created_at": "2025-06-03T08:17:17.346338+00:00"} {"global_step": 235543, "acc_step": 0, "speed/wps": 5526.692529892409, "speed/FLOPS": 244251521644491.16, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0463157594203949, "optim/lr": 1.2266304376743698e-05, "optim/total_tokens": 1975877894144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2513201236724854, "created_at": "2025-06-03T08:17:20.320039+00:00"} {"global_step": 235544, "acc_step": 0, "speed/wps": 5516.915120441533, "speed/FLOPS": 243819410192080.72, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049114473164081573, "optim/lr": 1.2262757151649151e-05, "optim/total_tokens": 1975886282752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2734038829803467, "created_at": "2025-06-03T08:17:23.298135+00:00"} {"global_step": 235545, "acc_step": 0, "speed/wps": 5534.375625913279, "speed/FLOPS": 244591075162963.22, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 193.64, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.049052078276872635, "optim/lr": 1.2259209926554603e-05, "optim/total_tokens": 1975894671360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2685641050338745, "created_at": "2025-06-03T08:17:26.266881+00:00"} {"global_step": 235546, "acc_step": 0, "speed/wps": 5518.771195481578, "speed/FLOPS": 243901439208597.44, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04577638581395149, "optim/lr": 1.2255662701460279e-05, "optim/total_tokens": 1975903059968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2596722841262817, "created_at": "2025-06-03T08:17:29.244531+00:00"} {"global_step": 235547, "acc_step": 0, "speed/wps": 5526.658190234676, "speed/FLOPS": 244250004007385.66, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05345390364527702, "optim/lr": 1.2252115476365733e-05, "optim/total_tokens": 1975911448576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.265468955039978, "created_at": "2025-06-03T08:17:32.214401+00:00"} {"global_step": 235548, "acc_step": 0, "speed/wps": 5520.378557505061, "speed/FLOPS": 243972476382810.72, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046869609504938126, "optim/lr": 1.2248568251271186e-05, "optim/total_tokens": 1975919837184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2691820859909058, "created_at": "2025-06-03T08:17:35.189037+00:00"} {"global_step": 235549, "acc_step": 0, "speed/wps": 5516.827591425717, "speed/FLOPS": 243815541857595.78, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05486182123422623, "optim/lr": 1.224502102617664e-05, "optim/total_tokens": 1975928225792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.254528522491455, "created_at": "2025-06-03T08:17:38.169883+00:00"} {"global_step": 235550, "acc_step": 0, "speed/wps": 5512.009597557376, "speed/FLOPS": 243602611189343.25, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04666021466255188, "optim/lr": 1.2241473801082315e-05, "optim/total_tokens": 1975936614400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.25095796585083, "created_at": "2025-06-03T08:17:41.146995+00:00"} {"global_step": 235551, "acc_step": 0, "speed/wps": 5505.328633258998, "speed/FLOPS": 243307346763630.2, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.85 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.85, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04865981638431549, "optim/lr": 1.2237926575987767e-05, "optim/total_tokens": 1975945003008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2674674987792969, "created_at": "2025-06-03T08:17:44.129478+00:00"} {"global_step": 235552, "acc_step": 0, "speed/wps": 5521.16089596072, "speed/FLOPS": 244007051738179.66, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04720825329422951, "optim/lr": 1.223437935089322e-05, "optim/total_tokens": 1975953391616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2553174495697021, "created_at": "2025-06-03T08:17:47.103990+00:00"} {"global_step": 235553, "acc_step": 0, "speed/wps": 5523.682589013631, "speed/FLOPS": 244118497663923.2, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04583079740405083, "optim/lr": 1.2230832125798896e-05, "optim/total_tokens": 1975961780224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2524927854537964, "created_at": "2025-06-03T08:17:50.081522+00:00"} {"global_step": 235554, "acc_step": 0, "speed/wps": 5514.484000097203, "speed/FLOPS": 243711967116463.28, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04646993800997734, "optim/lr": 1.222728490070435e-05, "optim/total_tokens": 1975970168832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.272055983543396, "created_at": "2025-06-03T08:17:53.057654+00:00"} {"global_step": 235555, "acc_step": 0, "speed/wps": 5524.74006241702, "speed/FLOPS": 244165232575713.47, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045696862041950226, "optim/lr": 1.2223737675609804e-05, "optim/total_tokens": 1975978557440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2666232585906982, "created_at": "2025-06-03T08:17:56.032473+00:00"} {"global_step": 235556, "acc_step": 0, "speed/wps": 5523.021116005372, "speed/FLOPS": 244089263942683.94, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04560840502381325, "optim/lr": 1.2220190450515255e-05, "optim/total_tokens": 1975986946048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2686980962753296, "created_at": "2025-06-03T08:17:59.005765+00:00"} {"global_step": 235557, "acc_step": 0, "speed/wps": 5519.566669714934, "speed/FLOPS": 243936595098105.53, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04724039137363434, "optim/lr": 1.2216643225420931e-05, "optim/total_tokens": 1975995334656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2590813636779785, "created_at": "2025-06-03T08:18:01.981433+00:00"} {"global_step": 235558, "acc_step": 0, "speed/wps": 5505.480202735121, "speed/FLOPS": 243314045358671.9, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04588555172085762, "optim/lr": 1.2213096000326385e-05, "optim/total_tokens": 1976003723264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2755186557769775, "created_at": "2025-06-03T08:18:04.962106+00:00"} {"global_step": 235559, "acc_step": 0, "speed/wps": 5510.38752514431, "speed/FLOPS": 243530923891205.0, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047185637056827545, "optim/lr": 1.2209548775231838e-05, "optim/total_tokens": 1976012111872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.261461615562439, "created_at": "2025-06-03T08:18:07.939980+00:00"} {"global_step": 235560, "acc_step": 0, "speed/wps": 5533.181841247571, "speed/FLOPS": 244538315991082.78, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04573837295174599, "optim/lr": 1.2206001550137292e-05, "optim/total_tokens": 1976020500480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.268380880355835, "created_at": "2025-06-03T08:18:10.906667+00:00"} {"global_step": 235561, "acc_step": 0, "speed/wps": 5516.819141002438, "speed/FLOPS": 243815168392140.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04645407199859619, "optim/lr": 1.2202454325042967e-05, "optim/total_tokens": 1976028889088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2652084827423096, "created_at": "2025-06-03T08:18:13.883273+00:00"} {"global_step": 235562, "acc_step": 0, "speed/wps": 5529.45131901879, "speed/FLOPS": 244373446003114.38, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047152068465948105, "optim/lr": 1.219890709994842e-05, "optim/total_tokens": 1976037277696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2664753198623657, "created_at": "2025-06-03T08:18:16.856249+00:00"} {"global_step": 235563, "acc_step": 0, "speed/wps": 5512.681410276409, "speed/FLOPS": 243632301872875.3, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04598604887723923, "optim/lr": 1.2195359874853873e-05, "optim/total_tokens": 1976045666304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2672967910766602, "created_at": "2025-06-03T08:18:19.835766+00:00"} {"global_step": 235564, "acc_step": 0, "speed/wps": 5524.2961881852525, "speed/FLOPS": 244145615606623.6, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045789677649736404, "optim/lr": 1.2191812649759326e-05, "optim/total_tokens": 1976054054912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2622742652893066, "created_at": "2025-06-03T08:18:22.811285+00:00"} {"global_step": 235565, "acc_step": 0, "speed/wps": 5506.811714298462, "speed/FLOPS": 243372891354477.6, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.84 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.84, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04628190025687218, "optim/lr": 1.2188265424665002e-05, "optim/total_tokens": 1976062443520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2665252685546875, "created_at": "2025-06-03T08:18:25.793999+00:00"} {"global_step": 235566, "acc_step": 0, "speed/wps": 5511.280262258979, "speed/FLOPS": 243570378302230.6, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04646604508161545, "optim/lr": 1.2184718199570456e-05, "optim/total_tokens": 1976070832128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2690225839614868, "created_at": "2025-06-03T08:18:28.772173+00:00"} {"global_step": 235567, "acc_step": 0, "speed/wps": 5513.940227174792, "speed/FLOPS": 243687935136574.88, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04566221684217453, "optim/lr": 1.2181170974475907e-05, "optim/total_tokens": 1976079220736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.265684723854065, "created_at": "2025-06-03T08:18:31.748103+00:00"} {"global_step": 235568, "acc_step": 0, "speed/wps": 5523.480933556058, "speed/FLOPS": 244109585524864.66, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04613236337900162, "optim/lr": 1.2177623749381361e-05, "optim/total_tokens": 1976087609344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2690340280532837, "created_at": "2025-06-03T08:18:34.719001+00:00"} {"global_step": 235569, "acc_step": 0, "speed/wps": 5529.4429398051725, "speed/FLOPS": 244373075684761.2, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 193.75, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04829252138733864, "optim/lr": 1.2174076524287037e-05, "optim/total_tokens": 1976095997952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2683002948760986, "created_at": "2025-06-03T08:18:37.686569+00:00"} {"global_step": 235570, "acc_step": 0, "speed/wps": 5533.961828596336, "speed/FLOPS": 244572787439561.0, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04835335910320282, "optim/lr": 1.217052929919249e-05, "optim/total_tokens": 1976104386560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2829540967941284, "created_at": "2025-06-03T08:18:40.651605+00:00"} {"global_step": 235571, "acc_step": 0, "speed/wps": 5521.740342742233, "speed/FLOPS": 244032660320045.03, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04609479755163193, "optim/lr": 1.2166982074097944e-05, "optim/total_tokens": 1976112775168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2827129364013672, "created_at": "2025-06-03T08:18:43.625046+00:00"} {"global_step": 235572, "acc_step": 0, "speed/wps": 5526.154268065183, "speed/FLOPS": 244227733226801.53, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048599112778902054, "optim/lr": 1.2163434849003396e-05, "optim/total_tokens": 1976121163776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2682042121887207, "created_at": "2025-06-03T08:18:46.594161+00:00"} {"global_step": 235573, "acc_step": 0, "speed/wps": 5526.436151044799, "speed/FLOPS": 244240191011692.7, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 193.86, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04636717215180397, "optim/lr": 1.2159887623909071e-05, "optim/total_tokens": 1976129552384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2585915327072144, "created_at": "2025-06-03T08:18:49.566243+00:00"} {"global_step": 235574, "acc_step": 0, "speed/wps": 5517.329467907219, "speed/FLOPS": 243837722229241.44, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.83 hours", "speed/est_time_elapsed_hrs": 194.26, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.83, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04646977037191391, "optim/lr": 1.2156340398814525e-05, "optim/total_tokens": 1976137940992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2499136924743652, "created_at": "2025-06-03T08:18:52.543279+00:00"} {"global_step": 235575, "acc_step": 0, "speed/wps": 5518.281092914298, "speed/FLOPS": 243879779183696.0, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04722609370946884, "optim/lr": 1.2152793173719978e-05, "optim/total_tokens": 1976146329600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2632404565811157, "created_at": "2025-06-03T08:18:55.520333+00:00"} {"global_step": 235576, "acc_step": 0, "speed/wps": 5524.859150954592, "speed/FLOPS": 244170495679523.75, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04575854912400246, "optim/lr": 1.2149245948625432e-05, "optim/total_tokens": 1976154718208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.271579384803772, "created_at": "2025-06-03T08:18:58.490609+00:00"} {"global_step": 235577, "acc_step": 0, "speed/wps": 5533.508508010297, "speed/FLOPS": 244552752989963.2, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04691819101572037, "optim/lr": 1.2145698723531106e-05, "optim/total_tokens": 1976163106816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2571473121643066, "created_at": "2025-06-03T08:19:01.460509+00:00"} {"global_step": 235578, "acc_step": 0, "speed/wps": 5526.706137305472, "speed/FLOPS": 244252123022499.5, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04620567336678505, "optim/lr": 1.214215149843656e-05, "optim/total_tokens": 1976171495424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2846853733062744, "created_at": "2025-06-03T08:19:04.429912+00:00"} {"global_step": 235579, "acc_step": 0, "speed/wps": 5518.214306239448, "speed/FLOPS": 243876827554512.84, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04773276299238205, "optim/lr": 1.2138604273342013e-05, "optim/total_tokens": 1976179884032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2478350400924683, "created_at": "2025-06-03T08:19:07.403347+00:00"} {"global_step": 235580, "acc_step": 0, "speed/wps": 5526.5215081898305, "speed/FLOPS": 244243963360605.62, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046455275267362595, "optim/lr": 1.2135057048247689e-05, "optim/total_tokens": 1976188272640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2747128009796143, "created_at": "2025-06-03T08:19:10.372075+00:00"} {"global_step": 235581, "acc_step": 0, "speed/wps": 5517.534537336348, "speed/FLOPS": 243846785248368.47, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 194.26, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04811509698629379, "optim/lr": 1.2131509823153142e-05, "optim/total_tokens": 1976196661248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2729545831680298, "created_at": "2025-06-03T08:19:13.346067+00:00"} {"global_step": 235582, "acc_step": 0, "speed/wps": 5510.683877083096, "speed/FLOPS": 243544021130032.62, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04666829854249954, "optim/lr": 1.2127962598058596e-05, "optim/total_tokens": 1976205049856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2733994722366333, "created_at": "2025-06-03T08:19:16.323193+00:00"} {"global_step": 235583, "acc_step": 0, "speed/wps": 5510.883321715741, "speed/FLOPS": 243552835561945.34, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04793921858072281, "optim/lr": 1.2124415372964048e-05, "optim/total_tokens": 1976213438464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2574585676193237, "created_at": "2025-06-03T08:19:19.300413+00:00"} {"global_step": 235584, "acc_step": 0, "speed/wps": 5513.766358653204, "speed/FLOPS": 243680251037860.47, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04592971131205559, "optim/lr": 1.2120868147869723e-05, "optim/total_tokens": 1976221827072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2395131587982178, "created_at": "2025-06-03T08:19:22.276499+00:00"} {"global_step": 235585, "acc_step": 0, "speed/wps": 5520.59123805915, "speed/FLOPS": 243981875774703.72, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04594249278306961, "optim/lr": 1.2117320922775177e-05, "optim/total_tokens": 1976230215680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.265824556350708, "created_at": "2025-06-03T08:19:25.252512+00:00"} {"global_step": 235586, "acc_step": 0, "speed/wps": 5518.032347842155, "speed/FLOPS": 243868785924700.0, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046167436987161636, "optim/lr": 1.211377369768063e-05, "optim/total_tokens": 1976238604288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2790429592132568, "created_at": "2025-06-03T08:19:28.232909+00:00"} {"global_step": 235587, "acc_step": 0, "speed/wps": 5517.16032373858, "speed/FLOPS": 243830246922745.94, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046100445091724396, "optim/lr": 1.2110226472586084e-05, "optim/total_tokens": 1976246992896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2693296670913696, "created_at": "2025-06-03T08:19:31.207246+00:00"} {"global_step": 235588, "acc_step": 0, "speed/wps": 5521.600277002122, "speed/FLOPS": 244026470131253.6, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0454353429377079, "optim/lr": 1.2106679247491758e-05, "optim/total_tokens": 1976255381504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2603641748428345, "created_at": "2025-06-03T08:19:34.179293+00:00"} {"global_step": 235589, "acc_step": 0, "speed/wps": 5535.972624872149, "speed/FLOPS": 244661654342763.6, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 193.54, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04608277231454849, "optim/lr": 1.2103132022397212e-05, "optim/total_tokens": 1976263770112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2616549730300903, "created_at": "2025-06-03T08:19:37.147460+00:00"} {"global_step": 235590, "acc_step": 0, "speed/wps": 5514.526062000585, "speed/FLOPS": 243713826037300.44, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04648499935865402, "optim/lr": 1.2099584797302665e-05, "optim/total_tokens": 1976272158720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2648833990097046, "created_at": "2025-06-03T08:19:40.126964+00:00"} {"global_step": 235591, "acc_step": 0, "speed/wps": 5505.936034812957, "speed/FLOPS": 243334190803352.2, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.82 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.82, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046689972281455994, "optim/lr": 1.2096037572208119e-05, "optim/total_tokens": 1976280547328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2690293788909912, "created_at": "2025-06-03T08:19:43.107554+00:00"} {"global_step": 235592, "acc_step": 0, "speed/wps": 5523.301415260763, "speed/FLOPS": 244101651735070.56, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046236518770456314, "optim/lr": 1.2092490347113794e-05, "optim/total_tokens": 1976288935936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.273871898651123, "created_at": "2025-06-03T08:19:46.078098+00:00"} {"global_step": 235593, "acc_step": 0, "speed/wps": 5530.283888015718, "speed/FLOPS": 244410241291304.12, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04663259536027908, "optim/lr": 1.2088943122019246e-05, "optim/total_tokens": 1976297324544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2667587995529175, "created_at": "2025-06-03T08:19:49.045621+00:00"} {"global_step": 235594, "acc_step": 0, "speed/wps": 5524.063125013322, "speed/FLOPS": 244135315407349.72, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046021003276109695, "optim/lr": 1.20853958969247e-05, "optim/total_tokens": 1976305713152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2629681825637817, "created_at": "2025-06-03T08:19:52.019137+00:00"} {"global_step": 235595, "acc_step": 0, "speed/wps": 5523.862758230381, "speed/FLOPS": 244126460221113.88, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04662198945879936, "optim/lr": 1.2081848671830153e-05, "optim/total_tokens": 1976314101760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.287816047668457, "created_at": "2025-06-03T08:19:54.989610+00:00"} {"global_step": 235596, "acc_step": 0, "speed/wps": 5525.438017608785, "speed/FLOPS": 244196078622730.94, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04844948276877403, "optim/lr": 1.2078301446735829e-05, "optim/total_tokens": 1976322490368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.273248553276062, "created_at": "2025-06-03T08:19:57.961769+00:00"} {"global_step": 235597, "acc_step": 0, "speed/wps": 5517.977207041604, "speed/FLOPS": 243866348983551.8, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.26, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04573023319244385, "optim/lr": 1.2074754221641283e-05, "optim/total_tokens": 1976330878976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2790063619613647, "created_at": "2025-06-03T08:20:00.935531+00:00"} {"global_step": 235598, "acc_step": 0, "speed/wps": 5525.932040676604, "speed/FLOPS": 244217911913689.25, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05054645612835884, "optim/lr": 1.2071206996546734e-05, "optim/total_tokens": 1976339267584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2640535831451416, "created_at": "2025-06-03T08:20:03.908805+00:00"} {"global_step": 235599, "acc_step": 0, "speed/wps": 5509.0462869547955, "speed/FLOPS": 243471648028307.84, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.81 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.81, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0455450676381588, "optim/lr": 1.2067659771452188e-05, "optim/total_tokens": 1976347656192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2683607339859009, "created_at": "2025-06-03T08:20:06.888762+00:00"} {"global_step": 235600, "acc_step": 0, "speed/wps": 5518.969731758134, "speed/FLOPS": 243910213495820.44, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04601912200450897, "optim/lr": 1.2064112546357864e-05, "optim/total_tokens": 1976356044800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2773562669754028, "created_at": "2025-06-03T08:20:09.864786+00:00"} {"global_step": 235601, "acc_step": 0, "speed/wps": 5518.335621389587, "speed/FLOPS": 243882189063201.75, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04796525090932846, "optim/lr": 1.2060565321263317e-05, "optim/total_tokens": 1976364433408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2705365419387817, "created_at": "2025-06-03T08:20:12.839900+00:00"} {"global_step": 235602, "acc_step": 0, "speed/wps": 5523.218302588478, "speed/FLOPS": 244097978580364.78, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05185340344905853, "optim/lr": 1.205701809616877e-05, "optim/total_tokens": 1976372822016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.26681649684906, "created_at": "2025-06-03T08:20:15.810420+00:00"} {"global_step": 235603, "acc_step": 0, "speed/wps": 5510.268317933004, "speed/FLOPS": 243525655542623.1, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.44, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0464780293405056, "optim/lr": 1.2053470871074224e-05, "optim/total_tokens": 1976381210624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.262017846107483, "created_at": "2025-06-03T08:20:18.788116+00:00"} {"global_step": 235604, "acc_step": 0, "speed/wps": 5524.557658663236, "speed/FLOPS": 244157171263423.25, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04997241869568825, "optim/lr": 1.2049923645979898e-05, "optim/total_tokens": 1976389599232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2738206386566162, "created_at": "2025-06-03T08:20:21.760820+00:00"} {"global_step": 235605, "acc_step": 0, "speed/wps": 5526.0606587509155, "speed/FLOPS": 244223596174246.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04598066955804825, "optim/lr": 1.2046376420885352e-05, "optim/total_tokens": 1976397987840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2744392156600952, "created_at": "2025-06-03T08:20:24.730154+00:00"} {"global_step": 235606, "acc_step": 0, "speed/wps": 5522.7825047828965, "speed/FLOPS": 244078718547973.47, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04829667881131172, "optim/lr": 1.2042829195790805e-05, "optim/total_tokens": 1976406376448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2594496011734009, "created_at": "2025-06-03T08:20:27.701154+00:00"} {"global_step": 235607, "acc_step": 0, "speed/wps": 5525.751946899108, "speed/FLOPS": 244209952690527.44, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04640273377299309, "optim/lr": 1.2039281970696481e-05, "optim/total_tokens": 1976414765056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2640987634658813, "created_at": "2025-06-03T08:20:30.670529+00:00"} {"global_step": 235608, "acc_step": 0, "speed/wps": 5522.924705959743, "speed/FLOPS": 244085003112138.47, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046441223472356796, "optim/lr": 1.2035734745601935e-05, "optim/total_tokens": 1976423153664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2630003690719604, "created_at": "2025-06-03T08:20:33.641582+00:00"} {"global_step": 235609, "acc_step": 0, "speed/wps": 5515.718345925931, "speed/FLOPS": 243766518884138.4, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04872172325849533, "optim/lr": 1.2032187520507387e-05, "optim/total_tokens": 1976431542272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2637970447540283, "created_at": "2025-06-03T08:20:36.616359+00:00"} {"global_step": 235610, "acc_step": 0, "speed/wps": 5535.56021601419, "speed/FLOPS": 244643427982141.7, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 193.57, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04576915502548218, "optim/lr": 1.202864029541284e-05, "optim/total_tokens": 1976439930880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.264227271080017, "created_at": "2025-06-03T08:20:39.580975+00:00"} {"global_step": 235611, "acc_step": 0, "speed/wps": 5515.570352492677, "speed/FLOPS": 243759978331887.6, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.8 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.8, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04701140522956848, "optim/lr": 1.2025093070318516e-05, "optim/total_tokens": 1976448319488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2466473579406738, "created_at": "2025-06-03T08:20:42.558135+00:00"} {"global_step": 235612, "acc_step": 0, "speed/wps": 5523.578653332369, "speed/FLOPS": 244113904238802.47, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048295069485902786, "optim/lr": 1.202154584522397e-05, "optim/total_tokens": 1976456708096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2568082809448242, "created_at": "2025-06-03T08:20:45.533218+00:00"} {"global_step": 235613, "acc_step": 0, "speed/wps": 5513.724725243729, "speed/FLOPS": 243678411054260.75, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.34, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04622191935777664, "optim/lr": 1.2017998620129423e-05, "optim/total_tokens": 1976465096704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2685348987579346, "created_at": "2025-06-03T08:20:48.509447+00:00"} {"global_step": 235614, "acc_step": 0, "speed/wps": 5525.069417889795, "speed/FLOPS": 244179788401815.97, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05346783250570297, "optim/lr": 1.2014451395034875e-05, "optim/total_tokens": 1976473485312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2722582817077637, "created_at": "2025-06-03T08:20:51.479241+00:00"} {"global_step": 235615, "acc_step": 0, "speed/wps": 5529.5207308200115, "speed/FLOPS": 244376513649446.56, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046795718371868134, "optim/lr": 1.201090416994055e-05, "optim/total_tokens": 1976481873920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.269692301750183, "created_at": "2025-06-03T08:20:54.446460+00:00"} {"global_step": 235616, "acc_step": 0, "speed/wps": 5518.949588779614, "speed/FLOPS": 243909323279270.94, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0458868183195591, "optim/lr": 1.2007356944846004e-05, "optim/total_tokens": 1976490262528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2750753164291382, "created_at": "2025-06-03T08:20:57.422915+00:00"} {"global_step": 235617, "acc_step": 0, "speed/wps": 5518.5323307218705, "speed/FLOPS": 243890882608839.03, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04557042568922043, "optim/lr": 1.2003809719751458e-05, "optim/total_tokens": 1976498651136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.265047550201416, "created_at": "2025-06-03T08:21:00.401365+00:00"} {"global_step": 235618, "acc_step": 0, "speed/wps": 5515.261564480311, "speed/FLOPS": 243746331482261.38, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04634307324886322, "optim/lr": 1.2000262494656911e-05, "optim/total_tokens": 1976507039744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2778269052505493, "created_at": "2025-06-03T08:21:03.378984+00:00"} {"global_step": 235619, "acc_step": 0, "speed/wps": 5526.009105004812, "speed/FLOPS": 244221317762545.06, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04661775380373001, "optim/lr": 1.1996715269562587e-05, "optim/total_tokens": 1976515428352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2664448022842407, "created_at": "2025-06-03T08:21:06.349299+00:00"} {"global_step": 235620, "acc_step": 0, "speed/wps": 5534.046987943599, "speed/FLOPS": 244576551046824.97, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0468282625079155, "optim/lr": 1.1993168044468039e-05, "optim/total_tokens": 1976523816960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.264130711555481, "created_at": "2025-06-03T08:21:09.315214+00:00"} {"global_step": 235621, "acc_step": 0, "speed/wps": 5522.636361998336, "speed/FLOPS": 244072259784922.47, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047137510031461716, "optim/lr": 1.1989620819373492e-05, "optim/total_tokens": 1976532205568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2921677827835083, "created_at": "2025-06-03T08:21:12.289357+00:00"} {"global_step": 235622, "acc_step": 0, "speed/wps": 5527.779660754487, "speed/FLOPS": 244299567264154.8, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04697144404053688, "optim/lr": 1.1986073594278946e-05, "optim/total_tokens": 1976540594176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2563045024871826, "created_at": "2025-06-03T08:21:15.258254+00:00"} {"global_step": 235623, "acc_step": 0, "speed/wps": 5525.79252112874, "speed/FLOPS": 244211745863799.44, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04980802908539772, "optim/lr": 1.1982526369184621e-05, "optim/total_tokens": 1976548982784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2660895586013794, "created_at": "2025-06-03T08:21:18.231209+00:00"} {"global_step": 235624, "acc_step": 0, "speed/wps": 5510.621761760181, "speed/FLOPS": 243541275950694.78, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04551144689321518, "optim/lr": 1.1978979144090075e-05, "optim/total_tokens": 1976557371392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2530620098114014, "created_at": "2025-06-03T08:21:21.213454+00:00"} {"global_step": 235625, "acc_step": 0, "speed/wps": 5503.83306842102, "speed/FLOPS": 243241250452786.34, "speed/curr_iter_time": 2.976, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.976, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.79 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.79, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04931245371699333, "optim/lr": 1.1975431918995527e-05, "optim/total_tokens": 1976565760000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2714186906814575, "created_at": "2025-06-03T08:21:24.195729+00:00"} {"global_step": 235626, "acc_step": 0, "speed/wps": 5518.22914892932, "speed/FLOPS": 243877483525433.4, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04688369110226631, "optim/lr": 1.197188469390098e-05, "optim/total_tokens": 1976574148608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2565207481384277, "created_at": "2025-06-03T08:21:27.173564+00:00"} {"global_step": 235627, "acc_step": 0, "speed/wps": 5516.680511564336, "speed/FLOPS": 243809041680545.7, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 194.33, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04637523740530014, "optim/lr": 1.1968337468806656e-05, "optim/total_tokens": 1976582537216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2620718479156494, "created_at": "2025-06-03T08:21:30.148006+00:00"} {"global_step": 235628, "acc_step": 0, "speed/wps": 5536.547468996884, "speed/FLOPS": 244687059510757.94, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04958895593881607, "optim/lr": 1.196479024371211e-05, "optim/total_tokens": 1976590925824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2692017555236816, "created_at": "2025-06-03T08:21:33.116464+00:00"} {"global_step": 235629, "acc_step": 0, "speed/wps": 5534.558192779531, "speed/FLOPS": 244599143683989.62, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 193.7, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046077143400907516, "optim/lr": 1.1961243018617563e-05, "optim/total_tokens": 1976599314432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.284471035003662, "created_at": "2025-06-03T08:21:36.087613+00:00"} {"global_step": 235630, "acc_step": 0, "speed/wps": 5518.8325523958465, "speed/FLOPS": 243904150870154.94, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048520028591156006, "optim/lr": 1.1957695793523015e-05, "optim/total_tokens": 1976607703040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.278253197669983, "created_at": "2025-06-03T08:21:39.061288+00:00"} {"global_step": 235631, "acc_step": 0, "speed/wps": 5525.731693201858, "speed/FLOPS": 244209057580776.84, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046280279755592346, "optim/lr": 1.195414856842869e-05, "optim/total_tokens": 1976616091648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.263587236404419, "created_at": "2025-06-03T08:21:42.033276+00:00"} {"global_step": 235632, "acc_step": 0, "speed/wps": 5525.681413021643, "speed/FLOPS": 244206835454168.6, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05017971619963646, "optim/lr": 1.1950601343334144e-05, "optim/total_tokens": 1976624480256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.263606309890747, "created_at": "2025-06-03T08:21:45.007571+00:00"} {"global_step": 235633, "acc_step": 0, "speed/wps": 5510.481086650993, "speed/FLOPS": 243535058830909.2, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04693730175495148, "optim/lr": 1.1947054118239598e-05, "optim/total_tokens": 1976632868864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2736939191818237, "created_at": "2025-06-03T08:21:47.985515+00:00"} {"global_step": 235634, "acc_step": 0, "speed/wps": 5517.600658606493, "speed/FLOPS": 243849707470069.53, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.046140220016241074, "optim/lr": 1.1943506893145273e-05, "optim/total_tokens": 1976641257472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2741591930389404, "created_at": "2025-06-03T08:21:50.959636+00:00"} {"global_step": 235635, "acc_step": 0, "speed/wps": 5513.003679232788, "speed/FLOPS": 243646544511225.22, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.78 hours", "speed/est_time_elapsed_hrs": 194.46, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.78, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0532701276242733, "optim/lr": 1.1939959668050725e-05, "optim/total_tokens": 1976649646080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.271653413772583, "created_at": "2025-06-03T08:21:53.939362+00:00"} {"global_step": 235636, "acc_step": 0, "speed/wps": 5537.621742399608, "speed/FLOPS": 244734536896528.56, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 193.6, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045973747968673706, "optim/lr": 1.1936412442956179e-05, "optim/total_tokens": 1976658034688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2672291994094849, "created_at": "2025-06-03T08:21:56.902947+00:00"} {"global_step": 235637, "acc_step": 0, "speed/wps": 5516.744283354537, "speed/FLOPS": 243811860067259.0, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.048912644386291504, "optim/lr": 1.1932865217861632e-05, "optim/total_tokens": 1976666423296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2899237871170044, "created_at": "2025-06-03T08:21:59.877375+00:00"} {"global_step": 235638, "acc_step": 0, "speed/wps": 5530.1171738007115, "speed/FLOPS": 244402873376321.56, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 193.86, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04940851777791977, "optim/lr": 1.1929317992767308e-05, "optim/total_tokens": 1976674811904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2665786743164062, "created_at": "2025-06-03T08:22:02.847111+00:00"} {"global_step": 235639, "acc_step": 0, "speed/wps": 5523.833895555496, "speed/FLOPS": 244125184638616.56, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04785367101430893, "optim/lr": 1.1925770767672762e-05, "optim/total_tokens": 1976683200512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2699105739593506, "created_at": "2025-06-03T08:22:05.817664+00:00"} {"global_step": 235640, "acc_step": 0, "speed/wps": 5517.140537852433, "speed/FLOPS": 243829372487851.62, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.045971374958753586, "optim/lr": 1.1922223542578215e-05, "optim/total_tokens": 1976691589120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.283286213874817, "created_at": "2025-06-03T08:22:08.792212+00:00"} {"global_step": 235641, "acc_step": 0, "speed/wps": 5522.202350006021, "speed/FLOPS": 244053078676336.9, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04688334837555885, "optim/lr": 1.1918676317483667e-05, "optim/total_tokens": 1976699977728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2624669075012207, "created_at": "2025-06-03T08:22:11.763679+00:00"} {"global_step": 235642, "acc_step": 0, "speed/wps": 5513.601321803864, "speed/FLOPS": 243672957253854.78, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.047973766922950745, "optim/lr": 1.1915129092389343e-05, "optim/total_tokens": 1976708366336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2653720378875732, "created_at": "2025-06-03T08:22:14.742794+00:00"} {"global_step": 235643, "acc_step": 0, "speed/wps": 5513.178833490266, "speed/FLOPS": 243654285432884.97, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.0466943196952343, "optim/lr": 1.1911581867294796e-05, "optim/total_tokens": 1976716754944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2796385288238525, "created_at": "2025-06-03T08:22:17.718843+00:00"} {"global_step": 235644, "acc_step": 0, "speed/wps": 5518.310237727954, "speed/FLOPS": 243881067235282.9, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04837217181921005, "optim/lr": 1.190803464220025e-05, "optim/total_tokens": 1976725143552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2772375345230103, "created_at": "2025-06-03T08:22:20.692315+00:00"} {"global_step": 235645, "acc_step": 0, "speed/wps": 5517.739930493839, "speed/FLOPS": 243855862574632.1, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.050501659512519836, "optim/lr": 1.1904487417105703e-05, "optim/total_tokens": 1976733532160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.257399559020996, "created_at": "2025-06-03T08:22:23.670415+00:00"} {"global_step": 235646, "acc_step": 0, "speed/wps": 5522.461712329926, "speed/FLOPS": 244064541163516.78, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04854969680309296, "optim/lr": 1.1900940192011377e-05, "optim/total_tokens": 1976741920768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2595281600952148, "created_at": "2025-06-03T08:22:26.642824+00:00"} {"global_step": 235647, "acc_step": 0, "speed/wps": 5524.456385120169, "speed/FLOPS": 244152695491184.66, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05542585626244545, "optim/lr": 1.1897392966916831e-05, "optim/total_tokens": 1976750309376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2755745649337769, "created_at": "2025-06-03T08:22:29.613256+00:00"} {"global_step": 235648, "acc_step": 0, "speed/wps": 5515.692834154913, "speed/FLOPS": 243765391394440.47, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05065927281975746, "optim/lr": 1.1893845741822285e-05, "optim/total_tokens": 1976758697984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2629797458648682, "created_at": "2025-06-03T08:22:32.591285+00:00"} {"global_step": 235649, "acc_step": 0, "speed/wps": 5513.819367019373, "speed/FLOPS": 243682593736323.72, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.050945837050676346, "optim/lr": 1.1890298516727738e-05, "optim/total_tokens": 1976767086592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2810181379318237, "created_at": "2025-06-03T08:22:35.568126+00:00"} {"global_step": 235650, "acc_step": 0, "speed/wps": 5507.592798695545, "speed/FLOPS": 243407411286876.3, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.77 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.77, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.04693162813782692, "optim/lr": 1.1886751291633414e-05, "optim/total_tokens": 1976775475200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2704761028289795, "created_at": "2025-06-03T08:22:38.550924+00:00"} {"global_step": 235651, "acc_step": 0, "speed/wps": 5516.5559266097025, "speed/FLOPS": 243803535663234.5, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.12, "optim/grad_norm": 0.05193117633461952, "optim/lr": 1.1883204066538866e-05, "optim/total_tokens": 1976783863808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2566007375717163, "created_at": "2025-06-03T08:22:41.525342+00:00"} {"global_step": 235652, "acc_step": 0, "speed/wps": 5525.873465257696, "speed/FLOPS": 244215323179989.7, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04791831970214844, "optim/lr": 1.187965684144432e-05, "optim/total_tokens": 1976792252416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2672003507614136, "created_at": "2025-06-03T08:22:44.498642+00:00"} {"global_step": 235653, "acc_step": 0, "speed/wps": 5529.762628821328, "speed/FLOPS": 244387204302958.53, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04913526773452759, "optim/lr": 1.1876109616349773e-05, "optim/total_tokens": 1976800641024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.266935110092163, "created_at": "2025-06-03T08:22:47.471079+00:00"} {"global_step": 235654, "acc_step": 0, "speed/wps": 5516.256071056436, "speed/FLOPS": 243790283582579.97, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05218568071722984, "optim/lr": 1.1872562391255448e-05, "optim/total_tokens": 1976809029632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2567472457885742, "created_at": "2025-06-03T08:22:50.445754+00:00"} {"global_step": 235655, "acc_step": 0, "speed/wps": 5515.385686789649, "speed/FLOPS": 243751817053018.56, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047024454921483994, "optim/lr": 1.1869015166160902e-05, "optim/total_tokens": 1976817418240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2602661848068237, "created_at": "2025-06-03T08:22:53.421149+00:00"} {"global_step": 235656, "acc_step": 0, "speed/wps": 5518.135659057582, "speed/FLOPS": 243873351751627.12, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05348612740635872, "optim/lr": 1.1865467941066354e-05, "optim/total_tokens": 1976825806848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2563883066177368, "created_at": "2025-06-03T08:22:56.394275+00:00"} {"global_step": 235657, "acc_step": 0, "speed/wps": 5511.622134315246, "speed/FLOPS": 243585487297257.75, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047447916120290756, "optim/lr": 1.1861920715971807e-05, "optim/total_tokens": 1976834195456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2643733024597168, "created_at": "2025-06-03T08:22:59.371294+00:00"} {"global_step": 235658, "acc_step": 0, "speed/wps": 5511.943274322273, "speed/FLOPS": 243599680041824.8, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048488810658454895, "optim/lr": 1.1858373490877483e-05, "optim/total_tokens": 1976842584064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2695103883743286, "created_at": "2025-06-03T08:23:02.348190+00:00"} {"global_step": 235659, "acc_step": 0, "speed/wps": 5513.497730167377, "speed/FLOPS": 243668379033752.12, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.76 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.76, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05096384510397911, "optim/lr": 1.1854826265782937e-05, "optim/total_tokens": 1976850972672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.267026424407959, "created_at": "2025-06-03T08:23:05.325423+00:00"} {"global_step": 235660, "acc_step": 0, "speed/wps": 5515.834949340657, "speed/FLOPS": 243771672158238.88, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.045855987817049026, "optim/lr": 1.185127904068839e-05, "optim/total_tokens": 1976859361280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.277662754058838, "created_at": "2025-06-03T08:23:08.300240+00:00"} {"global_step": 235661, "acc_step": 0, "speed/wps": 5518.699727390253, "speed/FLOPS": 243898280684767.75, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05853865295648575, "optim/lr": 1.1847731815594066e-05, "optim/total_tokens": 1976867749888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2702981233596802, "created_at": "2025-06-03T08:23:11.277385+00:00"} {"global_step": 235662, "acc_step": 0, "speed/wps": 5526.9861244092235, "speed/FLOPS": 244264497019381.4, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047174323350191116, "optim/lr": 1.1844184590499518e-05, "optim/total_tokens": 1976876138496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2725623846054077, "created_at": "2025-06-03T08:23:14.246850+00:00"} {"global_step": 235663, "acc_step": 0, "speed/wps": 5532.028710684185, "speed/FLOPS": 244487353522438.38, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05295135825872421, "optim/lr": 1.1840637365404971e-05, "optim/total_tokens": 1976884527104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2666974067687988, "created_at": "2025-06-03T08:23:17.213106+00:00"} {"global_step": 235664, "acc_step": 0, "speed/wps": 5523.117968552193, "speed/FLOPS": 244093544329517.12, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.054207053035497665, "optim/lr": 1.1837090140310425e-05, "optim/total_tokens": 1976892915712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2564349174499512, "created_at": "2025-06-03T08:23:20.187383+00:00"} {"global_step": 235665, "acc_step": 0, "speed/wps": 5535.8459772575825, "speed/FLOPS": 244656057166441.0, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046854931861162186, "optim/lr": 1.18335429152161e-05, "optim/total_tokens": 1976901304320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2567168474197388, "created_at": "2025-06-03T08:23:23.151264+00:00"} {"global_step": 235666, "acc_step": 0, "speed/wps": 5516.283109317505, "speed/FLOPS": 243791478535324.84, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.058990418910980225, "optim/lr": 1.1829995690121554e-05, "optim/total_tokens": 1976909692928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.258108139038086, "created_at": "2025-06-03T08:23:26.126562+00:00"} {"global_step": 235667, "acc_step": 0, "speed/wps": 5528.090666831772, "speed/FLOPS": 244313312140897.4, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04807873070240021, "optim/lr": 1.1826448465027006e-05, "optim/total_tokens": 1976918081536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.276339054107666, "created_at": "2025-06-03T08:23:29.098221+00:00"} {"global_step": 235668, "acc_step": 0, "speed/wps": 5527.49375777061, "speed/FLOPS": 244286931815651.56, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049029041081666946, "optim/lr": 1.182290123993246e-05, "optim/total_tokens": 1976926470144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.277237892150879, "created_at": "2025-06-03T08:23:32.070790+00:00"} {"global_step": 235669, "acc_step": 0, "speed/wps": 5518.349189413196, "speed/FLOPS": 243882788700397.8, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05783623456954956, "optim/lr": 1.1819354014838135e-05, "optim/total_tokens": 1976934858752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2598648071289062, "created_at": "2025-06-03T08:23:35.049189+00:00"} {"global_step": 235670, "acc_step": 0, "speed/wps": 5516.662077613326, "speed/FLOPS": 243808226994264.56, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04762447997927666, "optim/lr": 1.1815806789743589e-05, "optim/total_tokens": 1976943247360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.282416820526123, "created_at": "2025-06-03T08:23:38.024320+00:00"} {"global_step": 235671, "acc_step": 0, "speed/wps": 5520.415645853673, "speed/FLOPS": 243974115497984.0, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05206645280122757, "optim/lr": 1.1812259564649042e-05, "optim/total_tokens": 1976951635968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2809056043624878, "created_at": "2025-06-03T08:23:41.000373+00:00"} {"global_step": 235672, "acc_step": 0, "speed/wps": 5509.594114524581, "speed/FLOPS": 243495859202856.66, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.75 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.75, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04769239202141762, "optim/lr": 1.1808712339554494e-05, "optim/total_tokens": 1976960024576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2625293731689453, "created_at": "2025-06-03T08:23:43.983956+00:00"} {"global_step": 235673, "acc_step": 0, "speed/wps": 5518.655328297313, "speed/FLOPS": 243896318472114.94, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047405894845724106, "optim/lr": 1.180516511446017e-05, "optim/total_tokens": 1976968413184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2572849988937378, "created_at": "2025-06-03T08:23:46.959267+00:00"} {"global_step": 235674, "acc_step": 0, "speed/wps": 5521.757645973394, "speed/FLOPS": 244033425034296.38, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048560552299022675, "optim/lr": 1.1801617889365623e-05, "optim/total_tokens": 1976976801792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2681187391281128, "created_at": "2025-06-03T08:23:49.930786+00:00"} {"global_step": 235675, "acc_step": 0, "speed/wps": 5516.148865903008, "speed/FLOPS": 243785545663524.2, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04716448858380318, "optim/lr": 1.1798070664271077e-05, "optim/total_tokens": 1976985190400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2765896320343018, "created_at": "2025-06-03T08:23:52.905871+00:00"} {"global_step": 235676, "acc_step": 0, "speed/wps": 5519.544785426945, "speed/FLOPS": 243935627924590.38, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.045624975115060806, "optim/lr": 1.179452343917653e-05, "optim/total_tokens": 1976993579008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2647733688354492, "created_at": "2025-06-03T08:23:55.883648+00:00"} {"global_step": 235677, "acc_step": 0, "speed/wps": 5521.079476017404, "speed/FLOPS": 244003453393430.12, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049193125218153, "optim/lr": 1.1790976214082206e-05, "optim/total_tokens": 1977001967616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2743300199508667, "created_at": "2025-06-03T08:23:58.859177+00:00"} {"global_step": 235678, "acc_step": 0, "speed/wps": 5530.840725224798, "speed/FLOPS": 244434850645794.28, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04662388935685158, "optim/lr": 1.1787428988987658e-05, "optim/total_tokens": 1977010356224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2797081470489502, "created_at": "2025-06-03T08:24:01.826318+00:00"} {"global_step": 235679, "acc_step": 0, "speed/wps": 5525.304641921585, "speed/FLOPS": 244190184100035.34, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04724188148975372, "optim/lr": 1.1783881763893112e-05, "optim/total_tokens": 1977018744832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2608559131622314, "created_at": "2025-06-03T08:24:04.795969+00:00"} {"global_step": 235680, "acc_step": 0, "speed/wps": 5529.849448917867, "speed/FLOPS": 244391041306840.03, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049466218799352646, "optim/lr": 1.1780334538798565e-05, "optim/total_tokens": 1977027133440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2735823392868042, "created_at": "2025-06-03T08:24:07.765219+00:00"} {"global_step": 235681, "acc_step": 0, "speed/wps": 5522.791113055297, "speed/FLOPS": 244079098989552.4, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04809657111763954, "optim/lr": 1.177678731370424e-05, "optim/total_tokens": 1977035522048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2582021951675415, "created_at": "2025-06-03T08:24:10.736888+00:00"} {"global_step": 235682, "acc_step": 0, "speed/wps": 5525.631197105019, "speed/FLOPS": 244204616167682.2, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05211781710386276, "optim/lr": 1.1773240088609694e-05, "optim/total_tokens": 1977043910656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.27418053150177, "created_at": "2025-06-03T08:24:13.709670+00:00"} {"global_step": 235683, "acc_step": 0, "speed/wps": 5522.6943239834, "speed/FLOPS": 244074821407985.97, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04609755426645279, "optim/lr": 1.1769692863515146e-05, "optim/total_tokens": 1977052299264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.255049467086792, "created_at": "2025-06-03T08:24:16.684353+00:00"} {"global_step": 235684, "acc_step": 0, "speed/wps": 5520.110442710295, "speed/FLOPS": 243960627081217.97, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.050330206751823425, "optim/lr": 1.17661456384206e-05, "optim/total_tokens": 1977060687872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2599377632141113, "created_at": "2025-06-03T08:24:19.656677+00:00"} {"global_step": 235685, "acc_step": 0, "speed/wps": 5513.773637986785, "speed/FLOPS": 243680572747145.7, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.74 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.74, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0509115494787693, "optim/lr": 1.1762598413326275e-05, "optim/total_tokens": 1977069076480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.274018406867981, "created_at": "2025-06-03T08:24:22.637432+00:00"} {"global_step": 235686, "acc_step": 0, "speed/wps": 5522.236807224757, "speed/FLOPS": 244054601509037.03, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04789166897535324, "optim/lr": 1.1759051188231729e-05, "optim/total_tokens": 1977077465088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2705342769622803, "created_at": "2025-06-03T08:24:25.611508+00:00"} {"global_step": 235687, "acc_step": 0, "speed/wps": 5518.738584594531, "speed/FLOPS": 243899997974307.62, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04856904596090317, "optim/lr": 1.1755503963137183e-05, "optim/total_tokens": 1977085853696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2787033319473267, "created_at": "2025-06-03T08:24:28.584941+00:00"} {"global_step": 235688, "acc_step": 0, "speed/wps": 5526.074342902025, "speed/FLOPS": 244224200943684.03, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048360712826251984, "optim/lr": 1.1751956738042856e-05, "optim/total_tokens": 1977094242304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2384839057922363, "created_at": "2025-06-03T08:24:31.554495+00:00"} {"global_step": 235689, "acc_step": 0, "speed/wps": 5522.537730295325, "speed/FLOPS": 244067900768492.2, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04764154553413391, "optim/lr": 1.174840951294831e-05, "optim/total_tokens": 1977102630912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2766278982162476, "created_at": "2025-06-03T08:24:34.526006+00:00"} {"global_step": 235690, "acc_step": 0, "speed/wps": 5518.347081914321, "speed/FLOPS": 243882695559734.72, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049011021852493286, "optim/lr": 1.1744862287853764e-05, "optim/total_tokens": 1977111019520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2489356994628906, "created_at": "2025-06-03T08:24:37.499282+00:00"} {"global_step": 235691, "acc_step": 0, "speed/wps": 5517.753148596597, "speed/FLOPS": 243856446747117.62, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04706936702132225, "optim/lr": 1.1741315062759217e-05, "optim/total_tokens": 1977119408128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2739489078521729, "created_at": "2025-06-03T08:24:40.473794+00:00"} {"global_step": 235692, "acc_step": 0, "speed/wps": 5517.0119596528775, "speed/FLOPS": 243823689989554.12, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04895874485373497, "optim/lr": 1.1737767837664893e-05, "optim/total_tokens": 1977127796736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2563457489013672, "created_at": "2025-06-03T08:24:43.448578+00:00"} {"global_step": 235693, "acc_step": 0, "speed/wps": 5508.862897089353, "speed/FLOPS": 243463543134929.72, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04742870107293129, "optim/lr": 1.1734220612570346e-05, "optim/total_tokens": 1977136185344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2765241861343384, "created_at": "2025-06-03T08:24:46.426964+00:00"} {"global_step": 235694, "acc_step": 0, "speed/wps": 5523.230990315389, "speed/FLOPS": 244098539312952.6, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04690214619040489, "optim/lr": 1.1730673387475798e-05, "optim/total_tokens": 1977144573952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2731053829193115, "created_at": "2025-06-03T08:24:49.401505+00:00"} {"global_step": 235695, "acc_step": 0, "speed/wps": 5537.712131946855, "speed/FLOPS": 244738531651861.25, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047776054590940475, "optim/lr": 1.1727126162381252e-05, "optim/total_tokens": 1977152962560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2720611095428467, "created_at": "2025-06-03T08:24:52.367396+00:00"} {"global_step": 235696, "acc_step": 0, "speed/wps": 5517.7974847156265, "speed/FLOPS": 243858406176645.88, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.045826300978660583, "optim/lr": 1.1723578937286927e-05, "optim/total_tokens": 1977161351168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2768127918243408, "created_at": "2025-06-03T08:24:55.344060+00:00"} {"global_step": 235697, "acc_step": 0, "speed/wps": 5520.207966613881, "speed/FLOPS": 243964937138583.9, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0486939363181591, "optim/lr": 1.1720031712192381e-05, "optim/total_tokens": 1977169739776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2870702743530273, "created_at": "2025-06-03T08:24:58.316443+00:00"} {"global_step": 235698, "acc_step": 0, "speed/wps": 5518.570406120891, "speed/FLOPS": 243892565346588.2, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05016954615712166, "optim/lr": 1.1716484487097835e-05, "optim/total_tokens": 1977178128384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2596901655197144, "created_at": "2025-06-03T08:25:01.289546+00:00"} {"global_step": 235699, "acc_step": 0, "speed/wps": 5524.315643349835, "speed/FLOPS": 244146475425317.6, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046338699758052826, "optim/lr": 1.1712937262003286e-05, "optim/total_tokens": 1977186516992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2672703266143799, "created_at": "2025-06-03T08:25:04.260905+00:00"} {"global_step": 235700, "acc_step": 0, "speed/wps": 5531.891314513191, "speed/FLOPS": 244481281314937.78, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 193.86, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04605575278401375, "optim/lr": 1.1709390036908962e-05, "optim/total_tokens": 1977194905600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2655647993087769, "created_at": "2025-06-03T08:25:07.232219+00:00"} {"global_step": 235701, "acc_step": 0, "speed/wps": 5505.637447630691, "speed/FLOPS": 243320994778203.78, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.73 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.73, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04888549819588661, "optim/lr": 1.1705842811814416e-05, "optim/total_tokens": 1977203294208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2609158754348755, "created_at": "2025-06-03T08:25:10.213251+00:00"} {"global_step": 235702, "acc_step": 0, "speed/wps": 5531.459097344436, "speed/FLOPS": 244462179528366.8, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046863406896591187, "optim/lr": 1.170229558671987e-05, "optim/total_tokens": 1977211682816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2688287496566772, "created_at": "2025-06-03T08:25:13.181274+00:00"} {"global_step": 235703, "acc_step": 0, "speed/wps": 5515.314024511858, "speed/FLOPS": 243748649947140.97, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.44, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0488533154129982, "optim/lr": 1.1698748361625323e-05, "optim/total_tokens": 1977220071424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2578628063201904, "created_at": "2025-06-03T08:25:16.156415+00:00"} {"global_step": 235704, "acc_step": 0, "speed/wps": 5524.9910111486415, "speed/FLOPS": 244176323225179.06, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.03, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046532776206731796, "optim/lr": 1.1695201136530997e-05, "optim/total_tokens": 1977228460032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2562613487243652, "created_at": "2025-06-03T08:25:19.126494+00:00"} {"global_step": 235705, "acc_step": 0, "speed/wps": 5519.958173999751, "speed/FLOPS": 243953897583593.88, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046403758227825165, "optim/lr": 1.169165391143645e-05, "optim/total_tokens": 1977236848640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2684255838394165, "created_at": "2025-06-03T08:25:22.100209+00:00"} {"global_step": 235706, "acc_step": 0, "speed/wps": 5522.517432975652, "speed/FLOPS": 244067003730853.75, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04680914431810379, "optim/lr": 1.1688106686341904e-05, "optim/total_tokens": 1977245237248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2769782543182373, "created_at": "2025-06-03T08:25:25.072167+00:00"} {"global_step": 235707, "acc_step": 0, "speed/wps": 5526.015359586514, "speed/FLOPS": 244221594183042.44, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04765499010682106, "optim/lr": 1.1684559461247357e-05, "optim/total_tokens": 1977253625856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2660397291183472, "created_at": "2025-06-03T08:25:28.044917+00:00"} {"global_step": 235708, "acc_step": 0, "speed/wps": 5508.672649849035, "speed/FLOPS": 243455135180681.3, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.72 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.72, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.057605791836977005, "optim/lr": 1.1681012236153033e-05, "optim/total_tokens": 1977262014464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2588392496109009, "created_at": "2025-06-03T08:25:31.026165+00:00"} {"global_step": 235709, "acc_step": 0, "speed/wps": 5517.906055034742, "speed/FLOPS": 243863204429037.53, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04901592805981636, "optim/lr": 1.1677465011058485e-05, "optim/total_tokens": 1977270403072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2603434324264526, "created_at": "2025-06-03T08:25:34.000520+00:00"} {"global_step": 235710, "acc_step": 0, "speed/wps": 5521.616840640021, "speed/FLOPS": 244027202159268.3, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04778720438480377, "optim/lr": 1.1673917785963939e-05, "optim/total_tokens": 1977278791680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2708988189697266, "created_at": "2025-06-03T08:25:36.977467+00:00"} {"global_step": 235711, "acc_step": 0, "speed/wps": 5532.072084870263, "speed/FLOPS": 244489270439453.8, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 193.79, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04950566589832306, "optim/lr": 1.1670370560869392e-05, "optim/total_tokens": 1977287180288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2695319652557373, "created_at": "2025-06-03T08:25:39.943766+00:00"} {"global_step": 235712, "acc_step": 0, "speed/wps": 5533.678041199523, "speed/FLOPS": 244560245489177.47, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 193.8, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04808736965060234, "optim/lr": 1.1666823335775068e-05, "optim/total_tokens": 1977295568896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.263427495956421, "created_at": "2025-06-03T08:25:42.908889+00:00"} {"global_step": 235713, "acc_step": 0, "speed/wps": 5518.252738152217, "speed/FLOPS": 243878526048344.84, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.34, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05008753761649132, "optim/lr": 1.1663276110680521e-05, "optim/total_tokens": 1977303957504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2667728662490845, "created_at": "2025-06-03T08:25:45.882732+00:00"} {"global_step": 235714, "acc_step": 0, "speed/wps": 5525.546229316007, "speed/FLOPS": 244200861026312.44, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04835565760731697, "optim/lr": 1.1659728885585973e-05, "optim/total_tokens": 1977312346112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2664198875427246, "created_at": "2025-06-03T08:25:48.855634+00:00"} {"global_step": 235715, "acc_step": 0, "speed/wps": 5528.391890339057, "speed/FLOPS": 244326624678117.72, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04599432274699211, "optim/lr": 1.1656181660491649e-05, "optim/total_tokens": 1977320734720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.265039324760437, "created_at": "2025-06-03T08:25:51.824134+00:00"} {"global_step": 235716, "acc_step": 0, "speed/wps": 5514.797228279153, "speed/FLOPS": 243725810198858.34, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04713376611471176, "optim/lr": 1.1652634435397102e-05, "optim/total_tokens": 1977329123328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.257540225982666, "created_at": "2025-06-03T08:25:54.799458+00:00"} {"global_step": 235717, "acc_step": 0, "speed/wps": 5514.122177204141, "speed/FLOPS": 243695976396567.4, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04984770715236664, "optim/lr": 1.1649087210302556e-05, "optim/total_tokens": 1977337511936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.264069676399231, "created_at": "2025-06-03T08:25:57.775056+00:00"} {"global_step": 235718, "acc_step": 0, "speed/wps": 5524.260320957914, "speed/FLOPS": 244144030458760.34, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04698000103235245, "optim/lr": 1.164553998520801e-05, "optim/total_tokens": 1977345900544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.274303674697876, "created_at": "2025-06-03T08:26:00.745220+00:00"} {"global_step": 235719, "acc_step": 0, "speed/wps": 5503.420932339312, "speed/FLOPS": 243223036147478.53, "speed/curr_iter_time": 2.9762, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9762, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04635054990649223, "optim/lr": 1.1641992760113685e-05, "optim/total_tokens": 1977354289152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2643463611602783, "created_at": "2025-06-03T08:26:03.726740+00:00"} {"global_step": 235720, "acc_step": 0, "speed/wps": 5515.228588298631, "speed/FLOPS": 243744874103818.5, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.71 hours", "speed/est_time_elapsed_hrs": 194.46, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.71, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0462673082947731, "optim/lr": 1.1638445535019137e-05, "optim/total_tokens": 1977362677760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2736326456069946, "created_at": "2025-06-03T08:26:06.702218+00:00"} {"global_step": 235721, "acc_step": 0, "speed/wps": 5516.61687920954, "speed/FLOPS": 243806229456163.62, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.33, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04621228203177452, "optim/lr": 1.163489830992459e-05, "optim/total_tokens": 1977371066368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2665163278579712, "created_at": "2025-06-03T08:26:09.682051+00:00"} {"global_step": 235722, "acc_step": 0, "speed/wps": 5523.9086695102405, "speed/FLOPS": 244128489264688.47, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04657670110464096, "optim/lr": 1.1631351084830044e-05, "optim/total_tokens": 1977379454976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.270247459411621, "created_at": "2025-06-03T08:26:12.658116+00:00"} {"global_step": 235723, "acc_step": 0, "speed/wps": 5522.343084659484, "speed/FLOPS": 244059298427674.72, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046174850314855576, "optim/lr": 1.162780385973572e-05, "optim/total_tokens": 1977387843584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.253365397453308, "created_at": "2025-06-03T08:26:15.629694+00:00"} {"global_step": 235724, "acc_step": 0, "speed/wps": 5524.682432239171, "speed/FLOPS": 244162685616830.53, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046133410185575485, "optim/lr": 1.1624256634641173e-05, "optim/total_tokens": 1977396232192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2617172002792358, "created_at": "2025-06-03T08:26:18.599507+00:00"} {"global_step": 235725, "acc_step": 0, "speed/wps": 5527.773809921114, "speed/FLOPS": 244299308687267.0, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.02, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04879859462380409, "optim/lr": 1.1620709409546625e-05, "optim/total_tokens": 1977404620800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2565488815307617, "created_at": "2025-06-03T08:26:21.568220+00:00"} {"global_step": 235726, "acc_step": 0, "speed/wps": 5523.110305154475, "speed/FLOPS": 244093205646562.84, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04630473256111145, "optim/lr": 1.1617162184452079e-05, "optim/total_tokens": 1977413009408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.268869161605835, "created_at": "2025-06-03T08:26:24.538996+00:00"} {"global_step": 235727, "acc_step": 0, "speed/wps": 5510.528670154782, "speed/FLOPS": 243537161778222.22, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.7 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.7, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04908798635005951, "optim/lr": 1.1613614959357754e-05, "optim/total_tokens": 1977421398016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2456297874450684, "created_at": "2025-06-03T08:26:27.519970+00:00"} {"global_step": 235728, "acc_step": 0, "speed/wps": 5527.228059880097, "speed/FLOPS": 244275189328856.0, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.04, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.045858994126319885, "optim/lr": 1.1610067734263208e-05, "optim/total_tokens": 1977429786624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2831344604492188, "created_at": "2025-06-03T08:26:30.489116+00:00"} {"global_step": 235729, "acc_step": 0, "speed/wps": 5528.247661152112, "speed/FLOPS": 244320250486286.7, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04773794114589691, "optim/lr": 1.1606520509168662e-05, "optim/total_tokens": 1977438175232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2834945917129517, "created_at": "2025-06-03T08:26:33.460740+00:00"} {"global_step": 235730, "acc_step": 0, "speed/wps": 5530.537014972376, "speed/FLOPS": 244421428207167.22, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.045858800411224365, "optim/lr": 1.1602973284074113e-05, "optim/total_tokens": 1977446563840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2526779174804688, "created_at": "2025-06-03T08:26:36.428757+00:00"} {"global_step": 235731, "acc_step": 0, "speed/wps": 5522.0618647591855, "speed/FLOPS": 244046869947495.47, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04840369522571564, "optim/lr": 1.1599426058979789e-05, "optim/total_tokens": 1977454952448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2693533897399902, "created_at": "2025-06-03T08:26:39.400561+00:00"} {"global_step": 235732, "acc_step": 0, "speed/wps": 5524.006704500376, "speed/FLOPS": 244132821909463.88, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04685792699456215, "optim/lr": 1.1595878833885243e-05, "optim/total_tokens": 1977463341056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2788645029067993, "created_at": "2025-06-03T08:26:42.373521+00:00"} {"global_step": 235733, "acc_step": 0, "speed/wps": 5520.887410775486, "speed/FLOPS": 243994965092816.4, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049235545098781586, "optim/lr": 1.1592331608790696e-05, "optim/total_tokens": 1977471729664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2697073221206665, "created_at": "2025-06-03T08:26:45.349126+00:00"} {"global_step": 235734, "acc_step": 0, "speed/wps": 5520.654071652764, "speed/FLOPS": 243984652697929.97, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04673667252063751, "optim/lr": 1.158878438369615e-05, "optim/total_tokens": 1977480118272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2803337574005127, "created_at": "2025-06-03T08:26:48.322029+00:00"} {"global_step": 235735, "acc_step": 0, "speed/wps": 5513.15417279702, "speed/FLOPS": 243653195556468.38, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04563051834702492, "optim/lr": 1.1585237158601825e-05, "optim/total_tokens": 1977488506880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2583229541778564, "created_at": "2025-06-03T08:26:51.300145+00:00"} {"global_step": 235736, "acc_step": 0, "speed/wps": 5537.889777182305, "speed/FLOPS": 244746382661997.4, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 193.68, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04745762050151825, "optim/lr": 1.1581689933507277e-05, "optim/total_tokens": 1977496895488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.260380744934082, "created_at": "2025-06-03T08:26:54.263157+00:00"} {"global_step": 235737, "acc_step": 0, "speed/wps": 5525.402142928597, "speed/FLOPS": 244194493145489.88, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04753798618912697, "optim/lr": 1.1578142708412731e-05, "optim/total_tokens": 1977505284096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.27010977268219, "created_at": "2025-06-03T08:26:57.232534+00:00"} {"global_step": 235738, "acc_step": 0, "speed/wps": 5542.4537824741965, "speed/FLOPS": 244948088335202.22, "speed/curr_iter_time": 2.9539, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9539, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 193.43, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04631143435835838, "optim/lr": 1.1574595483318184e-05, "optim/total_tokens": 1977513672704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.272513508796692, "created_at": "2025-06-03T08:27:00.194271+00:00"} {"global_step": 235739, "acc_step": 0, "speed/wps": 5531.041000351242, "speed/FLOPS": 244443701781282.06, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04637305065989494, "optim/lr": 1.157104825822386e-05, "optim/total_tokens": 1977522061312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.265132188796997, "created_at": "2025-06-03T08:27:03.166279+00:00"} {"global_step": 235740, "acc_step": 0, "speed/wps": 5528.632322198465, "speed/FLOPS": 244337250535661.75, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04630879685282707, "optim/lr": 1.1567501033129314e-05, "optim/total_tokens": 1977530449920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2590447664260864, "created_at": "2025-06-03T08:27:06.134404+00:00"} {"global_step": 235741, "acc_step": 0, "speed/wps": 5522.508790017252, "speed/FLOPS": 244066621756331.16, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.14, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04715268313884735, "optim/lr": 1.1563953808034766e-05, "optim/total_tokens": 1977538838528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2610787153244019, "created_at": "2025-06-03T08:27:09.106932+00:00"} {"global_step": 235742, "acc_step": 0, "speed/wps": 5522.695022244434, "speed/FLOPS": 244074852267549.62, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04716581851243973, "optim/lr": 1.1560406582940441e-05, "optim/total_tokens": 1977547227136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2539578676223755, "created_at": "2025-06-03T08:27:12.077903+00:00"} {"global_step": 235743, "acc_step": 0, "speed/wps": 5519.444086515629, "speed/FLOPS": 243931177548133.97, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.33, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04687795042991638, "optim/lr": 1.1556859357845895e-05, "optim/total_tokens": 1977555615744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2684860229492188, "created_at": "2025-06-03T08:27:15.051118+00:00"} {"global_step": 235744, "acc_step": 0, "speed/wps": 5512.932317682794, "speed/FLOPS": 243643390695977.0, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.69 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.69, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04709675535559654, "optim/lr": 1.1553312132751348e-05, "optim/total_tokens": 1977564004352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2745050191879272, "created_at": "2025-06-03T08:27:18.028021+00:00"} {"global_step": 235745, "acc_step": 0, "speed/wps": 5526.90032272483, "speed/FLOPS": 244260705024104.06, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04659367725253105, "optim/lr": 1.1549764907656802e-05, "optim/total_tokens": 1977572392960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.248557686805725, "created_at": "2025-06-03T08:27:20.998449+00:00"} {"global_step": 235746, "acc_step": 0, "speed/wps": 5533.596120683583, "speed/FLOPS": 244556625021680.1, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 193.84, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0458899587392807, "optim/lr": 1.1546217682562476e-05, "optim/total_tokens": 1977580781568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2833569049835205, "created_at": "2025-06-03T08:27:23.963563+00:00"} {"global_step": 235747, "acc_step": 0, "speed/wps": 5525.37588768007, "speed/FLOPS": 244193332797891.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046056605875492096, "optim/lr": 1.154267045746793e-05, "optim/total_tokens": 1977589170176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2720468044281006, "created_at": "2025-06-03T08:27:26.933418+00:00"} {"global_step": 235748, "acc_step": 0, "speed/wps": 5523.807774017209, "speed/FLOPS": 244124030200326.44, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04823547229170799, "optim/lr": 1.1539123232373383e-05, "optim/total_tokens": 1977597558784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2624034881591797, "created_at": "2025-06-03T08:27:29.906650+00:00"} {"global_step": 235749, "acc_step": 0, "speed/wps": 5517.767194874182, "speed/FLOPS": 243857067520691.5, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04760705679655075, "optim/lr": 1.1535576007278837e-05, "optim/total_tokens": 1977605947392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2814431190490723, "created_at": "2025-06-03T08:27:32.880325+00:00"} {"global_step": 235750, "acc_step": 0, "speed/wps": 5518.747505308406, "speed/FLOPS": 243900392224200.56, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04850921779870987, "optim/lr": 1.1532028782184512e-05, "optim/total_tokens": 1977614336000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2713279724121094, "created_at": "2025-06-03T08:27:35.853863+00:00"} {"global_step": 235751, "acc_step": 0, "speed/wps": 5517.462211819497, "speed/FLOPS": 243843588830719.2, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04642382264137268, "optim/lr": 1.1528481557089966e-05, "optim/total_tokens": 1977622724608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2715661525726318, "created_at": "2025-06-03T08:27:38.829595+00:00"} {"global_step": 235752, "acc_step": 0, "speed/wps": 5503.99578262723, "speed/FLOPS": 243248441587854.06, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04745511710643768, "optim/lr": 1.1524934331995418e-05, "optim/total_tokens": 1977631113216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.281029462814331, "created_at": "2025-06-03T08:27:41.811057+00:00"} {"global_step": 235753, "acc_step": 0, "speed/wps": 5521.34057666008, "speed/FLOPS": 244014992705402.16, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04680471494793892, "optim/lr": 1.1521387106900871e-05, "optim/total_tokens": 1977639501824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.261961817741394, "created_at": "2025-06-03T08:27:44.785140+00:00"} {"global_step": 235754, "acc_step": 0, "speed/wps": 5528.3882432891305, "speed/FLOPS": 244326463497178.28, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046304043382406235, "optim/lr": 1.1517839881806547e-05, "optim/total_tokens": 1977647890432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2585678100585938, "created_at": "2025-06-03T08:27:47.754933+00:00"} {"global_step": 235755, "acc_step": 0, "speed/wps": 5524.467181914583, "speed/FLOPS": 244153172654234.78, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0487852543592453, "optim/lr": 1.1514292656712e-05, "optim/total_tokens": 1977656279040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2587250471115112, "created_at": "2025-06-03T08:27:50.725284+00:00"} {"global_step": 235756, "acc_step": 0, "speed/wps": 5530.759420766762, "speed/FLOPS": 244431257404903.0, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0471746101975441, "optim/lr": 1.1510745431617454e-05, "optim/total_tokens": 1977664667648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2888339757919312, "created_at": "2025-06-03T08:27:53.692603+00:00"} {"global_step": 235757, "acc_step": 0, "speed/wps": 5532.313059205852, "speed/FLOPS": 244499920271668.4, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04784143716096878, "optim/lr": 1.1507198206522906e-05, "optim/total_tokens": 1977673056256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2612289190292358, "created_at": "2025-06-03T08:27:56.661884+00:00"} {"global_step": 235758, "acc_step": 0, "speed/wps": 5524.460848431968, "speed/FLOPS": 244152892746720.88, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047693561762571335, "optim/lr": 1.1503650981428581e-05, "optim/total_tokens": 1977681444864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.279121994972229, "created_at": "2025-06-03T08:27:59.632004+00:00"} {"global_step": 235759, "acc_step": 0, "speed/wps": 5519.660840632998, "speed/FLOPS": 243940756970673.53, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.33, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046666696667671204, "optim/lr": 1.1500103756334035e-05, "optim/total_tokens": 1977689833472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.27702796459198, "created_at": "2025-06-03T08:28:02.605734+00:00"} {"global_step": 235760, "acc_step": 0, "speed/wps": 5521.205270398999, "speed/FLOPS": 244009012861222.62, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04679805785417557, "optim/lr": 1.1496556531239489e-05, "optim/total_tokens": 1977698222080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2669841051101685, "created_at": "2025-06-03T08:28:05.581307+00:00"} {"global_step": 235761, "acc_step": 0, "speed/wps": 5529.613444095754, "speed/FLOPS": 244380611101684.8, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 193.91, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04663868993520737, "optim/lr": 1.1493009306144942e-05, "optim/total_tokens": 1977706610688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2686258554458618, "created_at": "2025-06-03T08:28:08.553264+00:00"} {"global_step": 235762, "acc_step": 0, "speed/wps": 5523.848781499965, "speed/FLOPS": 244125842521168.9, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04774102196097374, "optim/lr": 1.1489462081050616e-05, "optim/total_tokens": 1977714999296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2748374938964844, "created_at": "2025-06-03T08:28:11.524177+00:00"} {"global_step": 235763, "acc_step": 0, "speed/wps": 5527.035058269642, "speed/FLOPS": 244266659645545.7, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04642274230718613, "optim/lr": 1.148591485595607e-05, "optim/total_tokens": 1977723387904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.252498745918274, "created_at": "2025-06-03T08:28:14.497285+00:00"} {"global_step": 235764, "acc_step": 0, "speed/wps": 5539.005768248884, "speed/FLOPS": 244795703754980.1, "speed/curr_iter_time": 2.9564, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9564, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 193.61, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04688370227813721, "optim/lr": 1.1482367630861523e-05, "optim/total_tokens": 1977731776512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2565993070602417, "created_at": "2025-06-03T08:28:17.462887+00:00"} {"global_step": 235765, "acc_step": 0, "speed/wps": 5515.612576230442, "speed/FLOPS": 243761844404976.16, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046473294496536255, "optim/lr": 1.1478820405766977e-05, "optim/total_tokens": 1977740165120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2566639184951782, "created_at": "2025-06-03T08:28:20.438029+00:00"} {"global_step": 235766, "acc_step": 0, "speed/wps": 5497.751764113478, "speed/FLOPS": 242972487929330.2, "speed/curr_iter_time": 2.9793, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9793, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.68 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.68, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05033993721008301, "optim/lr": 1.1475273180672652e-05, "optim/total_tokens": 1977748553728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2596012353897095, "created_at": "2025-06-03T08:28:23.422974+00:00"} {"global_step": 235767, "acc_step": 0, "speed/wps": 5514.355122206018, "speed/FLOPS": 243706271373329.75, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04635738953948021, "optim/lr": 1.1471725955578104e-05, "optim/total_tokens": 1977756942336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2768985033035278, "created_at": "2025-06-03T08:28:26.399105+00:00"} {"global_step": 235768, "acc_step": 0, "speed/wps": 5516.45736839766, "speed/FLOPS": 243799179894728.88, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.67 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.67, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046682652086019516, "optim/lr": 1.1468178730483558e-05, "optim/total_tokens": 1977765330944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2461837530136108, "created_at": "2025-06-03T08:28:29.373434+00:00"} {"global_step": 235769, "acc_step": 0, "speed/wps": 5518.366311278394, "speed/FLOPS": 243883545399201.94, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048271406441926956, "optim/lr": 1.1464631505389011e-05, "optim/total_tokens": 1977773719552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.26765775680542, "created_at": "2025-06-03T08:28:32.346824+00:00"} {"global_step": 235770, "acc_step": 0, "speed/wps": 5522.364551260704, "speed/FLOPS": 244060247141572.6, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049663662910461426, "optim/lr": 1.1461084280294687e-05, "optim/total_tokens": 1977782108160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2697776556015015, "created_at": "2025-06-03T08:28:35.318362+00:00"} {"global_step": 235771, "acc_step": 0, "speed/wps": 5529.850550085689, "speed/FLOPS": 244391089972821.47, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04649442061781883, "optim/lr": 1.145753705520014e-05, "optim/total_tokens": 1977790496768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.272770881652832, "created_at": "2025-06-03T08:28:38.285718+00:00"} {"global_step": 235772, "acc_step": 0, "speed/wps": 5531.836685673338, "speed/FLOPS": 244478866999832.06, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047060776501894, "optim/lr": 1.1453989830105594e-05, "optim/total_tokens": 1977798885376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2612043619155884, "created_at": "2025-06-03T08:28:41.252051+00:00"} {"global_step": 235773, "acc_step": 0, "speed/wps": 5527.5883448354825, "speed/FLOPS": 244291112079778.47, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04617505148053169, "optim/lr": 1.1450442605011268e-05, "optim/total_tokens": 1977807273984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2486480474472046, "created_at": "2025-06-03T08:28:44.220919+00:00"} {"global_step": 235774, "acc_step": 0, "speed/wps": 5529.557543231796, "speed/FLOPS": 244378140569624.44, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0465879812836647, "optim/lr": 1.1446895379916722e-05, "optim/total_tokens": 1977815662592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2602808475494385, "created_at": "2025-06-03T08:28:47.192138+00:00"} {"global_step": 235775, "acc_step": 0, "speed/wps": 5514.981726207806, "speed/FLOPS": 243733964062958.78, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 194.44, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04539700224995613, "optim/lr": 1.1443348154822175e-05, "optim/total_tokens": 1977824051200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2447731494903564, "created_at": "2025-06-03T08:28:50.167461+00:00"} {"global_step": 235776, "acc_step": 0, "speed/wps": 5525.066056762, "speed/FLOPS": 244179639857171.22, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047159742563962936, "optim/lr": 1.1439800929727629e-05, "optim/total_tokens": 1977832439808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2657110691070557, "created_at": "2025-06-03T08:28:53.137997+00:00"} {"global_step": 235777, "acc_step": 0, "speed/wps": 5521.993490272111, "speed/FLOPS": 244043848145139.1, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04620787128806114, "optim/lr": 1.1436253704633304e-05, "optim/total_tokens": 1977840828416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2604020833969116, "created_at": "2025-06-03T08:28:56.112679+00:00"} {"global_step": 235778, "acc_step": 0, "speed/wps": 5506.846981242577, "speed/FLOPS": 243374449972894.9, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.66 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.66, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04611311852931976, "optim/lr": 1.1432706479538756e-05, "optim/total_tokens": 1977849217024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.272912859916687, "created_at": "2025-06-03T08:28:59.095889+00:00"} {"global_step": 235779, "acc_step": 0, "speed/wps": 5536.854306018911, "speed/FLOPS": 244700620136597.28, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046617716550827026, "optim/lr": 1.142915925444421e-05, "optim/total_tokens": 1977857605632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.242568850517273, "created_at": "2025-06-03T08:29:02.059691+00:00"} {"global_step": 235780, "acc_step": 0, "speed/wps": 5529.41714971395, "speed/FLOPS": 244371935894734.78, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04749215021729469, "optim/lr": 1.1425612029349664e-05, "optim/total_tokens": 1977865994240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.276036262512207, "created_at": "2025-06-03T08:29:05.026888+00:00"} {"global_step": 235781, "acc_step": 0, "speed/wps": 5524.512701185034, "speed/FLOPS": 244155184372999.94, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046117883175611496, "optim/lr": 1.1422064804255339e-05, "optim/total_tokens": 1977874382848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2638317346572876, "created_at": "2025-06-03T08:29:08.002779+00:00"} {"global_step": 235782, "acc_step": 0, "speed/wps": 5526.843663662077, "speed/FLOPS": 244258200983537.72, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049592647701501846, "optim/lr": 1.1418517579160793e-05, "optim/total_tokens": 1977882771456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.274885654449463, "created_at": "2025-06-03T08:29:10.971437+00:00"} {"global_step": 235783, "acc_step": 0, "speed/wps": 5513.869435444642, "speed/FLOPS": 243684806504447.12, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05180114507675171, "optim/lr": 1.1414970354066245e-05, "optim/total_tokens": 1977891160064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.273565649986267, "created_at": "2025-06-03T08:29:13.947540+00:00"} {"global_step": 235784, "acc_step": 0, "speed/wps": 5519.43416133583, "speed/FLOPS": 243930738905988.53, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047224096953868866, "optim/lr": 1.1411423128971698e-05, "optim/total_tokens": 1977899548672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2622509002685547, "created_at": "2025-06-03T08:29:16.922017+00:00"} {"global_step": 235785, "acc_step": 0, "speed/wps": 5508.742440963784, "speed/FLOPS": 243458219590729.9, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049525078386068344, "optim/lr": 1.1407875903877374e-05, "optim/total_tokens": 1977907937280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2582285404205322, "created_at": "2025-06-03T08:29:19.906077+00:00"} {"global_step": 235786, "acc_step": 0, "speed/wps": 5516.944581714513, "speed/FLOPS": 243820712229550.0, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04629234969615936, "optim/lr": 1.1404328678782827e-05, "optim/total_tokens": 1977916325888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2862954139709473, "created_at": "2025-06-03T08:29:22.884071+00:00"} {"global_step": 235787, "acc_step": 0, "speed/wps": 5530.57696272547, "speed/FLOPS": 244423193693382.84, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.64 hours", "speed/est_time_elapsed_hrs": 193.97, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.64, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05159531533718109, "optim/lr": 1.1400781453688281e-05, "optim/total_tokens": 1977924714496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2633970975875854, "created_at": "2025-06-03T08:29:25.855489+00:00"} {"global_step": 235788, "acc_step": 0, "speed/wps": 5519.355878088425, "speed/FLOPS": 243927279187143.2, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.052859291434288025, "optim/lr": 1.1397234228593733e-05, "optim/total_tokens": 1977933103104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.267959475517273, "created_at": "2025-06-03T08:29:28.828372+00:00"} {"global_step": 235789, "acc_step": 0, "speed/wps": 5524.396669122142, "speed/FLOPS": 244150056349726.06, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.64 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.64, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0495336540043354, "optim/lr": 1.1393687003499408e-05, "optim/total_tokens": 1977941491712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2642443180084229, "created_at": "2025-06-03T08:29:31.799123+00:00"} {"global_step": 235790, "acc_step": 0, "speed/wps": 5520.297450349236, "speed/FLOPS": 243968891861667.3, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.34, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05895651876926422, "optim/lr": 1.1390139778404862e-05, "optim/total_tokens": 1977949880320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2632774114608765, "created_at": "2025-06-03T08:29:34.775464+00:00"} {"global_step": 235791, "acc_step": 0, "speed/wps": 5518.383643136919, "speed/FLOPS": 243884311378636.25, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.64 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.64, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04623492807149887, "optim/lr": 1.1386592553310316e-05, "optim/total_tokens": 1977958268928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2639065980911255, "created_at": "2025-06-03T08:29:37.749680+00:00"} {"global_step": 235792, "acc_step": 0, "speed/wps": 5528.063480994589, "speed/FLOPS": 244312110666043.62, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.64 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.64, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.06149296090006828, "optim/lr": 1.138304532821577e-05, "optim/total_tokens": 1977966657536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2718366384506226, "created_at": "2025-06-03T08:29:40.719123+00:00"} {"global_step": 235793, "acc_step": 0, "speed/wps": 5514.694369188826, "speed/FLOPS": 243721264353546.44, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04895833879709244, "optim/lr": 1.1379498103121445e-05, "optim/total_tokens": 1977975046144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.253988265991211, "created_at": "2025-06-03T08:29:43.695678+00:00"} {"global_step": 235794, "acc_step": 0, "speed/wps": 5525.406524033919, "speed/FLOPS": 244194686767920.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.64 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.64, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0501401424407959, "optim/lr": 1.1375950878026897e-05, "optim/total_tokens": 1977983434752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2669066190719604, "created_at": "2025-06-03T08:29:46.665883+00:00"} {"global_step": 235795, "acc_step": 0, "speed/wps": 5508.626314886802, "speed/FLOPS": 243453087412514.44, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.65 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.65, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04742956534028053, "optim/lr": 1.137240365293235e-05, "optim/total_tokens": 1977991823360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2872331142425537, "created_at": "2025-06-03T08:29:49.644375+00:00"} {"global_step": 235796, "acc_step": 0, "speed/wps": 5527.157732297292, "speed/FLOPS": 244272081209665.22, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.64 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.64, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.1569494754076004, "optim/lr": 1.1368856427837804e-05, "optim/total_tokens": 1978000211968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2572357654571533, "created_at": "2025-06-03T08:29:52.614032+00:00"} {"global_step": 235797, "acc_step": 0, "speed/wps": 5535.115683869865, "speed/FLOPS": 244623781936684.3, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.63 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.63, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046871379017829895, "optim/lr": 1.136530920274348e-05, "optim/total_tokens": 1978008600576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2539597749710083, "created_at": "2025-06-03T08:29:55.581267+00:00"} {"global_step": 235798, "acc_step": 0, "speed/wps": 5528.208422376387, "speed/FLOPS": 244318516333241.88, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.63 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.63, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047475818544626236, "optim/lr": 1.1361761977648933e-05, "optim/total_tokens": 1978016989184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2776974439620972, "created_at": "2025-06-03T08:29:58.550036+00:00"} {"global_step": 235799, "acc_step": 0, "speed/wps": 5529.814958338754, "speed/FLOPS": 244389516999782.0, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.63 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.63, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04745548591017723, "optim/lr": 1.1358214752554385e-05, "optim/total_tokens": 1978025377792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.258881688117981, "created_at": "2025-06-03T08:30:01.518764+00:00"} {"global_step": 235800, "acc_step": 0, "speed/wps": 5524.890053557195, "speed/FLOPS": 244171861416384.9, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.64 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.64, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0467589795589447, "optim/lr": 1.135466752746006e-05, "optim/total_tokens": 1978033766400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2615193128585815, "created_at": "2025-06-03T08:30:04.490929+00:00"} {"global_step": 235801, "acc_step": 0, "speed/wps": 245.3192914189429, "speed/FLOPS": 10841857022755.643, "speed/curr_iter_time": 2.8907, "speed/data_load_time": 0.0021, "speed/curr_step_time": 2.8907, "speed/est_time_elapsed": "7.89 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 189.34, "speed/est_time_elapsed_days": 7.89, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04767587035894394, "optim/lr": 1.1351120302365514e-05, "optim/total_tokens": 1978042155008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2694883346557617, "created_at": "2025-06-03T08:31:11.284251+00:00"} {"global_step": 235802, "acc_step": 0, "speed/wps": 5640.640510845246, "speed/FLOPS": 249287439163968.2, "speed/curr_iter_time": 2.9034, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9034, "speed/est_time_elapsed": "7.92 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 190.17, "speed/est_time_elapsed_days": 7.92, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047274503856897354, "optim/lr": 1.1347573077270968e-05, "optim/total_tokens": 1978050543616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2665168046951294, "created_at": "2025-06-03T08:31:14.195743+00:00"} {"global_step": 235803, "acc_step": 0, "speed/wps": 5572.263438750508, "speed/FLOPS": 246265522562962.7, "speed/curr_iter_time": 2.9392, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9392, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 192.52, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047742750495672226, "optim/lr": 1.1344025852176421e-05, "optim/total_tokens": 1978058932224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2665140628814697, "created_at": "2025-06-03T08:31:17.143588+00:00"} {"global_step": 235804, "acc_step": 0, "speed/wps": 5567.4272989276815, "speed/FLOPS": 246051789936401.34, "speed/curr_iter_time": 2.9405, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9405, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 192.61, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04722380265593529, "optim/lr": 1.1340478627082095e-05, "optim/total_tokens": 1978067320832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.25299870967865, "created_at": "2025-06-03T08:31:20.091560+00:00"} {"global_step": 235805, "acc_step": 0, "speed/wps": 5566.000703520716, "speed/FLOPS": 245988741721390.72, "speed/curr_iter_time": 2.9426, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9426, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 192.74, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0479118674993515, "optim/lr": 1.1336931401987549e-05, "optim/total_tokens": 1978075709440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.262322187423706, "created_at": "2025-06-03T08:31:23.043350+00:00"} {"global_step": 235806, "acc_step": 0, "speed/wps": 5549.314903845883, "speed/FLOPS": 245251314781428.03, "speed/curr_iter_time": 2.9515, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9515, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0468766875565052, "optim/lr": 1.1333384176893002e-05, "optim/total_tokens": 1978084098048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2574676275253296, "created_at": "2025-06-03T08:31:26.005217+00:00"} {"global_step": 235807, "acc_step": 0, "speed/wps": 5542.824857419108, "speed/FLOPS": 244964487948433.6, "speed/curr_iter_time": 2.9536, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9536, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048588287085294724, "optim/lr": 1.1329836951798456e-05, "optim/total_tokens": 1978092486656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2665231227874756, "created_at": "2025-06-03T08:31:28.969021+00:00"} {"global_step": 235808, "acc_step": 0, "speed/wps": 5540.729542576945, "speed/FLOPS": 244871885757203.56, "speed/curr_iter_time": 2.9561, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9561, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04753575101494789, "optim/lr": 1.1326289726704131e-05, "optim/total_tokens": 1978100875264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.274398922920227, "created_at": "2025-06-03T08:31:31.929996+00:00"} {"global_step": 235809, "acc_step": 0, "speed/wps": 5549.310037933449, "speed/FLOPS": 245251099733004.44, "speed/curr_iter_time": 2.9515, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9515, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 193.33, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04658056050539017, "optim/lr": 1.1322742501609585e-05, "optim/total_tokens": 1978109263872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2761733531951904, "created_at": "2025-06-03T08:31:34.887499+00:00"} {"global_step": 235810, "acc_step": 0, "speed/wps": 5549.25437878651, "speed/FLOPS": 245248639883599.06, "speed/curr_iter_time": 2.9503, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9503, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 193.25, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04809598997235298, "optim/lr": 1.1319195276515037e-05, "optim/total_tokens": 1978117652480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2637321949005127, "created_at": "2025-06-03T08:31:37.844627+00:00"} {"global_step": 235811, "acc_step": 0, "speed/wps": 5533.650782103444, "speed/FLOPS": 244559040776655.44, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04930700734257698, "optim/lr": 1.131564805142049e-05, "optim/total_tokens": 1978126041088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2672369480133057, "created_at": "2025-06-03T08:31:40.810725+00:00"} {"global_step": 235812, "acc_step": 0, "speed/wps": 5522.046024281372, "speed/FLOPS": 244046169879455.03, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.63 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.63, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04816841706633568, "optim/lr": 1.1312100826326166e-05, "optim/total_tokens": 1978134429696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.276640772819519, "created_at": "2025-06-03T08:31:43.786932+00:00"} {"global_step": 235813, "acc_step": 0, "speed/wps": 5515.63051853171, "speed/FLOPS": 243762637362855.16, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.63 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.63, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05133634805679321, "optim/lr": 1.130855360123162e-05, "optim/total_tokens": 1978142818304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2673150300979614, "created_at": "2025-06-03T08:31:46.765033+00:00"} {"global_step": 235814, "acc_step": 0, "speed/wps": 5519.59051412315, "speed/FLOPS": 243937648898901.94, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.63 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.63, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04647501930594444, "optim/lr": 1.1305006376137073e-05, "optim/total_tokens": 1978151206912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2680405378341675, "created_at": "2025-06-03T08:31:49.741681+00:00"} {"global_step": 235815, "acc_step": 0, "speed/wps": 5540.451036937076, "speed/FLOPS": 244859577233442.44, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04787768796086311, "optim/lr": 1.1301459151042525e-05, "optim/total_tokens": 1978159595520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2611738443374634, "created_at": "2025-06-03T08:31:52.707458+00:00"} {"global_step": 235816, "acc_step": 0, "speed/wps": 5523.8140873572975, "speed/FLOPS": 244124309217643.72, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05037180334329605, "optim/lr": 1.12979119259482e-05, "optim/total_tokens": 1978167984128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2570970058441162, "created_at": "2025-06-03T08:31:55.683382+00:00"} {"global_step": 235817, "acc_step": 0, "speed/wps": 5522.324095396266, "speed/FLOPS": 244058459199436.34, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04620439186692238, "optim/lr": 1.1294364700853654e-05, "optim/total_tokens": 1978176372736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2569741010665894, "created_at": "2025-06-03T08:31:58.658423+00:00"} {"global_step": 235818, "acc_step": 0, "speed/wps": 5534.2523766600525, "speed/FLOPS": 244585628176817.47, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 193.87, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04990818351507187, "optim/lr": 1.1290817475759108e-05, "optim/total_tokens": 1978184761344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2674809694290161, "created_at": "2025-06-03T08:32:01.626759+00:00"} {"global_step": 235819, "acc_step": 0, "speed/wps": 5534.904563218439, "speed/FLOPS": 244614451484504.72, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049426741898059845, "optim/lr": 1.1287270250664561e-05, "optim/total_tokens": 1978193149952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2603996992111206, "created_at": "2025-06-03T08:32:04.591397+00:00"} {"global_step": 235820, "acc_step": 0, "speed/wps": 5523.503774285413, "speed/FLOPS": 244110594968192.72, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05158913508057594, "optim/lr": 1.1283723025570235e-05, "optim/total_tokens": 1978201538560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2609572410583496, "created_at": "2025-06-03T08:32:07.564724+00:00"} {"global_step": 235821, "acc_step": 0, "speed/wps": 5525.30253301127, "speed/FLOPS": 244190090896993.78, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047431427985429764, "optim/lr": 1.1280175800475689e-05, "optim/total_tokens": 1978209927168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2650359869003296, "created_at": "2025-06-03T08:32:10.537291+00:00"} {"global_step": 235822, "acc_step": 0, "speed/wps": 5517.720261160398, "speed/FLOPS": 243854993290770.78, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04802464693784714, "optim/lr": 1.1276628575381143e-05, "optim/total_tokens": 1978218315776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.250592589378357, "created_at": "2025-06-03T08:32:13.515960+00:00"} {"global_step": 235823, "acc_step": 0, "speed/wps": 5531.595990252491, "speed/FLOPS": 244468229494221.44, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05041240528225899, "optim/lr": 1.1273081350286596e-05, "optim/total_tokens": 1978226704384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.265331506729126, "created_at": "2025-06-03T08:32:16.483286+00:00"} {"global_step": 235824, "acc_step": 0, "speed/wps": 5528.179001368866, "speed/FLOPS": 244317216075299.8, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04751277714967728, "optim/lr": 1.1269534125192272e-05, "optim/total_tokens": 1978235092992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2652816772460938, "created_at": "2025-06-03T08:32:19.455716+00:00"} {"global_step": 235825, "acc_step": 0, "speed/wps": 5520.758977957924, "speed/FLOPS": 243989289019658.88, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.62 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.62, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04798928275704384, "optim/lr": 1.1265986900097724e-05, "optim/total_tokens": 1978243481600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.257817268371582, "created_at": "2025-06-03T08:32:22.428310+00:00"} {"global_step": 235826, "acc_step": 0, "speed/wps": 5527.216894557308, "speed/FLOPS": 244274695878738.0, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047320473939180374, "optim/lr": 1.1262439675003177e-05, "optim/total_tokens": 1978251870208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.27439546585083, "created_at": "2025-06-03T08:32:25.397767+00:00"} {"global_step": 235827, "acc_step": 0, "speed/wps": 5517.938161954858, "speed/FLOPS": 243864623390568.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0466218926012516, "optim/lr": 1.1258892449908853e-05, "optim/total_tokens": 1978260258816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2651996612548828, "created_at": "2025-06-03T08:32:28.371912+00:00"} {"global_step": 235828, "acc_step": 0, "speed/wps": 5520.046738567325, "speed/FLOPS": 243957811684166.06, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.050525229424238205, "optim/lr": 1.1255345224814306e-05, "optim/total_tokens": 1978268647424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.267418622970581, "created_at": "2025-06-03T08:32:31.345250+00:00"} {"global_step": 235829, "acc_step": 0, "speed/wps": 5526.5017944278225, "speed/FLOPS": 244243092113229.03, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049581971019506454, "optim/lr": 1.125179799971976e-05, "optim/total_tokens": 1978277036032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2634963989257812, "created_at": "2025-06-03T08:32:34.317949+00:00"} {"global_step": 235830, "acc_step": 0, "speed/wps": 5520.1946930100585, "speed/FLOPS": 243964350513235.4, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047716159373521805, "optim/lr": 1.1248250774625214e-05, "optim/total_tokens": 1978285424640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2780826091766357, "created_at": "2025-06-03T08:32:37.291347+00:00"} {"global_step": 235831, "acc_step": 0, "speed/wps": 5514.473099249356, "speed/FLOPS": 243711485354784.06, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046728551387786865, "optim/lr": 1.1244703549530887e-05, "optim/total_tokens": 1978293813248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2726069688796997, "created_at": "2025-06-03T08:32:40.267273+00:00"} {"global_step": 235832, "acc_step": 0, "speed/wps": 5520.710332311895, "speed/FLOPS": 243987139131095.4, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049773477017879486, "optim/lr": 1.1241156324436341e-05, "optim/total_tokens": 1978302201856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2755481004714966, "created_at": "2025-06-03T08:32:43.239683+00:00"} {"global_step": 235833, "acc_step": 0, "speed/wps": 5527.213517791923, "speed/FLOPS": 244274546642991.84, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048340585082769394, "optim/lr": 1.1237609099341795e-05, "optim/total_tokens": 1978310590464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2677758932113647, "created_at": "2025-06-03T08:32:46.209371+00:00"} {"global_step": 235834, "acc_step": 0, "speed/wps": 5535.279867687362, "speed/FLOPS": 244631038021048.72, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 193.75, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048240967094898224, "optim/lr": 1.1234061874247248e-05, "optim/total_tokens": 1978318979072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.261279582977295, "created_at": "2025-06-03T08:32:49.174404+00:00"} {"global_step": 235835, "acc_step": 0, "speed/wps": 5521.661775261599, "speed/FLOPS": 244029188039545.84, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.33, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047790609300136566, "optim/lr": 1.1230514649152924e-05, "optim/total_tokens": 1978327367680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2680832147598267, "created_at": "2025-06-03T08:32:52.145924+00:00"} {"global_step": 235836, "acc_step": 0, "speed/wps": 5527.757082963133, "speed/FLOPS": 244298569441340.6, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04637680575251579, "optim/lr": 1.1226967424058376e-05, "optim/total_tokens": 1978335756288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2520043849945068, "created_at": "2025-06-03T08:32:55.117548+00:00"} {"global_step": 235837, "acc_step": 0, "speed/wps": 5529.755321983381, "speed/FLOPS": 244386881378121.06, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 193.94, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04668254777789116, "optim/lr": 1.122342019896383e-05, "optim/total_tokens": 1978344144896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2688782215118408, "created_at": "2025-06-03T08:32:58.085265+00:00"} {"global_step": 235838, "acc_step": 0, "speed/wps": 5536.338832538708, "speed/FLOPS": 244677838847204.72, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 193.82, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04642760008573532, "optim/lr": 1.1219872973869283e-05, "optim/total_tokens": 1978352533504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2745823860168457, "created_at": "2025-06-03T08:33:01.052572+00:00"} {"global_step": 235839, "acc_step": 0, "speed/wps": 5516.769847670931, "speed/FLOPS": 243812989879193.56, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.61 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.61, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04565246403217316, "optim/lr": 1.1216325748774958e-05, "optim/total_tokens": 1978360922112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.269340991973877, "created_at": "2025-06-03T08:33:04.026869+00:00"} {"global_step": 235840, "acc_step": 0, "speed/wps": 5522.569986489693, "speed/FLOPS": 244069326327181.12, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046434879302978516, "optim/lr": 1.1212778523680412e-05, "optim/total_tokens": 1978369310720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2649863958358765, "created_at": "2025-06-03T08:33:07.000911+00:00"} {"global_step": 235841, "acc_step": 0, "speed/wps": 5535.9042329685535, "speed/FLOPS": 244658631770686.16, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 193.74, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04682939872145653, "optim/lr": 1.1209231298585864e-05, "optim/total_tokens": 1978377699328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2551571130752563, "created_at": "2025-06-03T08:33:09.968528+00:00"} {"global_step": 235842, "acc_step": 0, "speed/wps": 5534.27974701483, "speed/FLOPS": 244586837806404.44, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04721584543585777, "optim/lr": 1.1205684073491317e-05, "optim/total_tokens": 1978386087936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2796133756637573, "created_at": "2025-06-03T08:33:12.937370+00:00"} {"global_step": 235843, "acc_step": 0, "speed/wps": 5536.06191835742, "speed/FLOPS": 244665600657767.06, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 193.83, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04779132083058357, "optim/lr": 1.1202136848396993e-05, "optim/total_tokens": 1978394476544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2745747566223145, "created_at": "2025-06-03T08:33:15.901770+00:00"} {"global_step": 235844, "acc_step": 0, "speed/wps": 5526.2815727950565, "speed/FLOPS": 244233359444257.28, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04629163444042206, "optim/lr": 1.1198589623302447e-05, "optim/total_tokens": 1978402865152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2790672779083252, "created_at": "2025-06-03T08:33:18.873625+00:00"} {"global_step": 235845, "acc_step": 0, "speed/wps": 5528.359887064624, "speed/FLOPS": 244325210297195.38, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046421390026807785, "optim/lr": 1.11950423982079e-05, "optim/total_tokens": 1978411253760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2585018873214722, "created_at": "2025-06-03T08:33:21.842561+00:00"} {"global_step": 235846, "acc_step": 0, "speed/wps": 5524.383168059004, "speed/FLOPS": 244149459671840.06, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04759114980697632, "optim/lr": 1.1191495173113352e-05, "optim/total_tokens": 1978419642368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2513322830200195, "created_at": "2025-06-03T08:33:24.814399+00:00"} {"global_step": 235847, "acc_step": 0, "speed/wps": 5516.828555497047, "speed/FLOPS": 243815584464614.0, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04643595218658447, "optim/lr": 1.1187947948019028e-05, "optim/total_tokens": 1978428030976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2559953927993774, "created_at": "2025-06-03T08:33:27.791959+00:00"} {"global_step": 235848, "acc_step": 0, "speed/wps": 5516.61669886546, "speed/FLOPS": 243806221485878.4, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049287378787994385, "optim/lr": 1.1184400722924481e-05, "optim/total_tokens": 1978436419584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2635152339935303, "created_at": "2025-06-03T08:33:30.768791+00:00"} {"global_step": 235849, "acc_step": 0, "speed/wps": 5516.1217532875335, "speed/FLOPS": 243784347424695.16, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04743776470422745, "optim/lr": 1.1180853497829935e-05, "optim/total_tokens": 1978444808192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2642074823379517, "created_at": "2025-06-03T08:33:33.747693+00:00"} {"global_step": 235850, "acc_step": 0, "speed/wps": 5523.867458638968, "speed/FLOPS": 244126667955114.56, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.26, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047540079802274704, "optim/lr": 1.1177306272735388e-05, "optim/total_tokens": 1978453196800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2934777736663818, "created_at": "2025-06-03T08:33:36.718937+00:00"} {"global_step": 235851, "acc_step": 0, "speed/wps": 5523.904538812369, "speed/FLOPS": 244128306708985.34, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047855738550424576, "optim/lr": 1.1173759047641064e-05, "optim/total_tokens": 1978461585408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2544465065002441, "created_at": "2025-06-03T08:33:39.689904+00:00"} {"global_step": 235852, "acc_step": 0, "speed/wps": 5525.541112128226, "speed/FLOPS": 244200634872804.62, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0475434809923172, "optim/lr": 1.1170211822546516e-05, "optim/total_tokens": 1978469974016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2563964128494263, "created_at": "2025-06-03T08:33:42.660199+00:00"} {"global_step": 235853, "acc_step": 0, "speed/wps": 5515.504028705024, "speed/FLOPS": 243757047159949.28, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04828537255525589, "optim/lr": 1.116666459745197e-05, "optim/total_tokens": 1978478362624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2710520029067993, "created_at": "2025-06-03T08:33:45.635938+00:00"} {"global_step": 235854, "acc_step": 0, "speed/wps": 5516.510787030437, "speed/FLOPS": 243801540724876.3, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04801101237535477, "optim/lr": 1.1163117372357645e-05, "optim/total_tokens": 1978486751232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2549480199813843, "created_at": "2025-06-03T08:33:48.614207+00:00"} {"global_step": 235855, "acc_step": 0, "speed/wps": 5513.256922173568, "speed/FLOPS": 243657736552992.78, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.6 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.6, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047992393374443054, "optim/lr": 1.1159570147263099e-05, "optim/total_tokens": 1978495139840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2575318813323975, "created_at": "2025-06-03T08:33:51.591658+00:00"} {"global_step": 235856, "acc_step": 0, "speed/wps": 5532.081723284063, "speed/FLOPS": 244489696408009.88, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04788784310221672, "optim/lr": 1.1156022922168552e-05, "optim/total_tokens": 1978503528448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2629766464233398, "created_at": "2025-06-03T08:33:54.559262+00:00"} {"global_step": 235857, "acc_step": 0, "speed/wps": 5533.074264784052, "speed/FLOPS": 244533561662021.47, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046985287219285965, "optim/lr": 1.1152475697074004e-05, "optim/total_tokens": 1978511917056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.268338680267334, "created_at": "2025-06-03T08:33:57.528402+00:00"} {"global_step": 235858, "acc_step": 0, "speed/wps": 5523.047099624041, "speed/FLOPS": 244090412285632.88, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0487973727285862, "optim/lr": 1.114892847197968e-05, "optim/total_tokens": 1978520305664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2676396369934082, "created_at": "2025-06-03T08:34:00.499546+00:00"} {"global_step": 235859, "acc_step": 0, "speed/wps": 5518.370396480685, "speed/FLOPS": 243883725944233.22, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04651162028312683, "optim/lr": 1.1145381246885133e-05, "optim/total_tokens": 1978528694272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2771811485290527, "created_at": "2025-06-03T08:34:03.473840+00:00"} {"global_step": 235860, "acc_step": 0, "speed/wps": 5521.548276143492, "speed/FLOPS": 244024171959466.66, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0494636707007885, "optim/lr": 1.1141834021790587e-05, "optim/total_tokens": 1978537082880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2639082670211792, "created_at": "2025-06-03T08:34:06.447200+00:00"} {"global_step": 235861, "acc_step": 0, "speed/wps": 5524.739505476421, "speed/FLOPS": 244165207961789.66, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04619598761200905, "optim/lr": 1.113828679669604e-05, "optim/total_tokens": 1978545471488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2646641731262207, "created_at": "2025-06-03T08:34:09.419382+00:00"} {"global_step": 235862, "acc_step": 0, "speed/wps": 5536.134545477985, "speed/FLOPS": 244668810404756.75, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 193.84, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04932370409369469, "optim/lr": 1.1134739571601716e-05, "optim/total_tokens": 1978553860096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2689405679702759, "created_at": "2025-06-03T08:34:12.385171+00:00"} {"global_step": 235863, "acc_step": 0, "speed/wps": 5518.060009307627, "speed/FLOPS": 243870008419889.66, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04594265669584274, "optim/lr": 1.1131192346507168e-05, "optim/total_tokens": 1978562248704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.268688678741455, "created_at": "2025-06-03T08:34:15.361896+00:00"} {"global_step": 235864, "acc_step": 0, "speed/wps": 5513.766995037882, "speed/FLOPS": 243680279162805.9, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04667951539158821, "optim/lr": 1.1127645121412622e-05, "optim/total_tokens": 1978570637312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2626060247421265, "created_at": "2025-06-03T08:34:18.339442+00:00"} {"global_step": 235865, "acc_step": 0, "speed/wps": 5497.01706019004, "speed/FLOPS": 242940017776469.8, "speed/curr_iter_time": 2.9797, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9797, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.59 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.59, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047343019396066666, "optim/lr": 1.1124097896318075e-05, "optim/total_tokens": 1978579025920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2662607431411743, "created_at": "2025-06-03T08:34:21.327579+00:00"} {"global_step": 235866, "acc_step": 0, "speed/wps": 5535.01258310576, "speed/FLOPS": 244619225410628.44, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 193.88, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0467897467315197, "optim/lr": 1.112055067122375e-05, "optim/total_tokens": 1978587414528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2704880237579346, "created_at": "2025-06-03T08:34:24.293776+00:00"} {"global_step": 235867, "acc_step": 0, "speed/wps": 5531.990082732803, "speed/FLOPS": 244485646364703.06, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04588545113801956, "optim/lr": 1.1117003446129204e-05, "optim/total_tokens": 1978595803136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2672291994094849, "created_at": "2025-06-03T08:34:27.263983+00:00"} {"global_step": 235868, "acc_step": 0, "speed/wps": 5522.931888557039, "speed/FLOPS": 244085320546175.1, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04745752736926079, "optim/lr": 1.1113456221034656e-05, "optim/total_tokens": 1978604191744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.270268201828003, "created_at": "2025-06-03T08:34:30.235179+00:00"} {"global_step": 235869, "acc_step": 0, "speed/wps": 5524.171433355957, "speed/FLOPS": 244140102081721.8, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04670058935880661, "optim/lr": 1.110990899594011e-05, "optim/total_tokens": 1978612580352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.263687252998352, "created_at": "2025-06-03T08:34:33.206269+00:00"} {"global_step": 235870, "acc_step": 0, "speed/wps": 5509.627408588594, "speed/FLOPS": 243497330630071.6, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04712968319654465, "optim/lr": 1.1106361770845785e-05, "optim/total_tokens": 1978620968960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2792574167251587, "created_at": "2025-06-03T08:34:36.184466+00:00"} {"global_step": 235871, "acc_step": 0, "speed/wps": 5520.675804484915, "speed/FLOPS": 243985613177872.3, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04627472534775734, "optim/lr": 1.1102814545751239e-05, "optim/total_tokens": 1978629357568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.286451816558838, "created_at": "2025-06-03T08:34:39.159414+00:00"} {"global_step": 235872, "acc_step": 0, "speed/wps": 5522.789614191033, "speed/FLOPS": 244079032747423.84, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04666603356599808, "optim/lr": 1.1099267320656693e-05, "optim/total_tokens": 1978637746176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2721387147903442, "created_at": "2025-06-03T08:34:42.130777+00:00"} {"global_step": 235873, "acc_step": 0, "speed/wps": 5517.070131943438, "speed/FLOPS": 243826260907044.16, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04852291941642761, "optim/lr": 1.1095720095562144e-05, "optim/total_tokens": 1978646134784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2648009061813354, "created_at": "2025-06-03T08:34:45.110189+00:00"} {"global_step": 235874, "acc_step": 0, "speed/wps": 5538.748425802874, "speed/FLOPS": 244784330536064.53, "speed/curr_iter_time": 2.9555, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9555, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04679511487483978, "optim/lr": 1.109217287046782e-05, "optim/total_tokens": 1978654523392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2498549222946167, "created_at": "2025-06-03T08:34:48.076267+00:00"} {"global_step": 235875, "acc_step": 0, "speed/wps": 5534.233290607123, "speed/FLOPS": 244584784670969.28, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 193.92, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04816329851746559, "optim/lr": 1.1088625645373274e-05, "optim/total_tokens": 1978662912000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.250817060470581, "created_at": "2025-06-03T08:34:51.041245+00:00"} {"global_step": 235876, "acc_step": 0, "speed/wps": 5533.935884488246, "speed/FLOPS": 244571640842777.44, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 193.93, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04871007800102234, "optim/lr": 1.1085078420278727e-05, "optim/total_tokens": 1978671300608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.270214557647705, "created_at": "2025-06-03T08:34:54.013225+00:00"} {"global_step": 235877, "acc_step": 0, "speed/wps": 5510.692149478893, "speed/FLOPS": 243544386727584.88, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047183454036712646, "optim/lr": 1.108153119518418e-05, "optim/total_tokens": 1978679689216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2693097591400146, "created_at": "2025-06-03T08:34:56.991341+00:00"} {"global_step": 235878, "acc_step": 0, "speed/wps": 5527.383090520324, "speed/FLOPS": 244282040889635.28, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04627887159585953, "optim/lr": 1.1077983970089855e-05, "optim/total_tokens": 1978688077824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2631001472473145, "created_at": "2025-06-03T08:34:59.964698+00:00"} {"global_step": 235879, "acc_step": 0, "speed/wps": 5507.442623249152, "speed/FLOPS": 243400774300813.38, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.051246967166662216, "optim/lr": 1.1074436744995308e-05, "optim/total_tokens": 1978696466432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2743114233016968, "created_at": "2025-06-03T08:35:02.948635+00:00"} {"global_step": 235880, "acc_step": 0, "speed/wps": 5515.352517622927, "speed/FLOPS": 243750351145624.6, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04701614007353783, "optim/lr": 1.1070889519900762e-05, "optim/total_tokens": 1978704855040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2570865154266357, "created_at": "2025-06-03T08:35:05.923823+00:00"} {"global_step": 235881, "acc_step": 0, "speed/wps": 5511.544048765894, "speed/FLOPS": 243582036315654.5, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04797409102320671, "optim/lr": 1.1067342294806437e-05, "optim/total_tokens": 1978713243648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2676540613174438, "created_at": "2025-06-03T08:35:08.901658+00:00"} {"global_step": 235882, "acc_step": 0, "speed/wps": 5504.178332801183, "speed/FLOPS": 243256509371166.28, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.58 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.58, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0471179336309433, "optim/lr": 1.1063795069711891e-05, "optim/total_tokens": 1978721632256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2585604190826416, "created_at": "2025-06-03T08:35:11.883260+00:00"} {"global_step": 235883, "acc_step": 0, "speed/wps": 5518.801923542759, "speed/FLOPS": 243902797231621.16, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.052215736359357834, "optim/lr": 1.1060247844617345e-05, "optim/total_tokens": 1978730020864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.274785041809082, "created_at": "2025-06-03T08:35:14.858342+00:00"} {"global_step": 235884, "acc_step": 0, "speed/wps": 5532.405192392441, "speed/FLOPS": 244503992086935.22, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04600972682237625, "optim/lr": 1.1056700619522797e-05, "optim/total_tokens": 1978738409472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.26686692237854, "created_at": "2025-06-03T08:35:17.824397+00:00"} {"global_step": 235885, "acc_step": 0, "speed/wps": 5521.056837267487, "speed/FLOPS": 244002452876559.4, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04640473425388336, "optim/lr": 1.1053153394428472e-05, "optim/total_tokens": 1978746798080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2641210556030273, "created_at": "2025-06-03T08:35:20.796199+00:00"} {"global_step": 235886, "acc_step": 0, "speed/wps": 5521.117270347376, "speed/FLOPS": 244005123709365.97, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046317048370838165, "optim/lr": 1.1049606169333926e-05, "optim/total_tokens": 1978755186688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2635871171951294, "created_at": "2025-06-03T08:35:23.768230+00:00"} {"global_step": 235887, "acc_step": 0, "speed/wps": 5512.716019993791, "speed/FLOPS": 243633831445235.0, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04609498009085655, "optim/lr": 1.104605894423938e-05, "optim/total_tokens": 1978763575296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2519832849502563, "created_at": "2025-06-03T08:35:26.746790+00:00"} {"global_step": 235888, "acc_step": 0, "speed/wps": 5520.778371832997, "speed/FLOPS": 243990146129670.28, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04756629839539528, "optim/lr": 1.1042511719144833e-05, "optim/total_tokens": 1978771963904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2597118616104126, "created_at": "2025-06-03T08:35:29.719004+00:00"} {"global_step": 235889, "acc_step": 0, "speed/wps": 5516.964011084542, "speed/FLOPS": 243821570908256.72, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0464051216840744, "optim/lr": 1.1038964494050507e-05, "optim/total_tokens": 1978780352512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.266191840171814, "created_at": "2025-06-03T08:35:32.693416+00:00"} {"global_step": 235890, "acc_step": 0, "speed/wps": 5516.31798092308, "speed/FLOPS": 243793019681802.22, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.57 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.57, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04631926864385605, "optim/lr": 1.103541726895596e-05, "optim/total_tokens": 1978788741120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2863578796386719, "created_at": "2025-06-03T08:35:35.669971+00:00"} {"global_step": 235891, "acc_step": 0, "speed/wps": 5516.378382522466, "speed/FLOPS": 243795689123331.7, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04689512029290199, "optim/lr": 1.1031870043861414e-05, "optim/total_tokens": 1978797129728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2803473472595215, "created_at": "2025-06-03T08:35:38.644899+00:00"} {"global_step": 235892, "acc_step": 0, "speed/wps": 5514.02504233749, "speed/FLOPS": 243691683532642.75, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04658375680446625, "optim/lr": 1.1028322818766868e-05, "optim/total_tokens": 1978805518336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2754873037338257, "created_at": "2025-06-03T08:35:41.621018+00:00"} {"global_step": 235893, "acc_step": 0, "speed/wps": 5522.6935438036835, "speed/FLOPS": 244074786928035.8, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.34, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04763835296034813, "optim/lr": 1.1024775593672543e-05, "optim/total_tokens": 1978813906944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2559821605682373, "created_at": "2025-06-03T08:35:44.592204+00:00"} {"global_step": 235894, "acc_step": 0, "speed/wps": 5522.344402562621, "speed/FLOPS": 244059356672247.75, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047109052538871765, "optim/lr": 1.1021228368577995e-05, "optim/total_tokens": 1978822295552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2739695310592651, "created_at": "2025-06-03T08:35:47.563438+00:00"} {"global_step": 235895, "acc_step": 0, "speed/wps": 5513.026067559228, "speed/FLOPS": 243647533960660.03, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04828200116753578, "optim/lr": 1.1017681143483449e-05, "optim/total_tokens": 1978830684160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2678985595703125, "created_at": "2025-06-03T08:35:50.541071+00:00"} {"global_step": 235896, "acc_step": 0, "speed/wps": 5514.407377449189, "speed/FLOPS": 243708580787611.34, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0479389913380146, "optim/lr": 1.1014133918388902e-05, "optim/total_tokens": 1978839072768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2523711919784546, "created_at": "2025-06-03T08:35:53.519950+00:00"} {"global_step": 235897, "acc_step": 0, "speed/wps": 5508.17441523225, "speed/FLOPS": 243433115760815.34, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04830262437462807, "optim/lr": 1.1010586693294578e-05, "optim/total_tokens": 1978847461376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2757914066314697, "created_at": "2025-06-03T08:35:56.499488+00:00"} {"global_step": 235898, "acc_step": 0, "speed/wps": 5517.989844306219, "speed/FLOPS": 243866907485964.44, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04915524274110794, "optim/lr": 1.1007039468200031e-05, "optim/total_tokens": 1978855849984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2745062112808228, "created_at": "2025-06-03T08:35:59.473689+00:00"} {"global_step": 235899, "acc_step": 0, "speed/wps": 5502.88376530114, "speed/FLOPS": 243199296113861.5, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.56 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.56, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.050750695168972015, "optim/lr": 1.1003492243105483e-05, "optim/total_tokens": 1978864238592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.252219557762146, "created_at": "2025-06-03T08:36:02.456755+00:00"} {"global_step": 235900, "acc_step": 0, "speed/wps": 5525.931231809594, "speed/FLOPS": 244217876165907.53, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04851721599698067, "optim/lr": 1.0999945018010937e-05, "optim/total_tokens": 1978872627200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.271512508392334, "created_at": "2025-06-03T08:36:05.426153+00:00"} {"global_step": 235901, "acc_step": 0, "speed/wps": 5524.031562982755, "speed/FLOPS": 244133920527147.75, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04624183103442192, "optim/lr": 1.0996397792916612e-05, "optim/total_tokens": 1978881015808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2702184915542603, "created_at": "2025-06-03T08:36:08.398042+00:00"} {"global_step": 235902, "acc_step": 0, "speed/wps": 5518.014373468687, "speed/FLOPS": 243867991549393.88, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.052818965166807175, "optim/lr": 1.0992850567822066e-05, "optim/total_tokens": 1978889404416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2758468389511108, "created_at": "2025-06-03T08:36:11.372214+00:00"} {"global_step": 235903, "acc_step": 0, "speed/wps": 5521.839381430113, "speed/FLOPS": 244037037323123.34, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04620538651943207, "optim/lr": 1.098930334272752e-05, "optim/total_tokens": 1978897793024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2556246519088745, "created_at": "2025-06-03T08:36:14.348857+00:00"} {"global_step": 235904, "acc_step": 0, "speed/wps": 5513.911131959379, "speed/FLOPS": 243686649276976.44, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05288983881473541, "optim/lr": 1.0985756117632971e-05, "optim/total_tokens": 1978906181632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2624084949493408, "created_at": "2025-06-03T08:36:17.325348+00:00"} {"global_step": 235905, "acc_step": 0, "speed/wps": 5519.034262478355, "speed/FLOPS": 243913065423356.03, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048128169029951096, "optim/lr": 1.0982208892538647e-05, "optim/total_tokens": 1978914570240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2763822078704834, "created_at": "2025-06-03T08:36:20.299526+00:00"} {"global_step": 235906, "acc_step": 0, "speed/wps": 5510.407503836213, "speed/FLOPS": 243531806847126.9, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048049479722976685, "optim/lr": 1.09786616674441e-05, "optim/total_tokens": 1978922958848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2678824663162231, "created_at": "2025-06-03T08:36:23.283149+00:00"} {"global_step": 235907, "acc_step": 0, "speed/wps": 5516.803910150846, "speed/FLOPS": 243814495266458.22, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.055199891328811646, "optim/lr": 1.0975114442349554e-05, "optim/total_tokens": 1978931347456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2618705034255981, "created_at": "2025-06-03T08:36:26.261422+00:00"} {"global_step": 235908, "acc_step": 0, "speed/wps": 5528.298603902102, "speed/FLOPS": 244322501895087.56, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.06, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046913985162973404, "optim/lr": 1.097156721725523e-05, "optim/total_tokens": 1978939736064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.252547025680542, "created_at": "2025-06-03T08:36:29.233243+00:00"} {"global_step": 235909, "acc_step": 0, "speed/wps": 5522.721082113953, "speed/FLOPS": 244076003980395.9, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.05964883044362068, "optim/lr": 1.0968019992160683e-05, "optim/total_tokens": 1978948124672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2517390251159668, "created_at": "2025-06-03T08:36:32.207398+00:00"} {"global_step": 235910, "acc_step": 0, "speed/wps": 5516.637248219294, "speed/FLOPS": 243807129662136.72, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.57, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047441571950912476, "optim/lr": 1.0964472767066135e-05, "optim/total_tokens": 1978956513280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.268090844154358, "created_at": "2025-06-03T08:36:35.182352+00:00"} {"global_step": 235911, "acc_step": 0, "speed/wps": 5515.003440336452, "speed/FLOPS": 243734923716301.94, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04609198123216629, "optim/lr": 1.0960925541971589e-05, "optim/total_tokens": 1978964901888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2637828588485718, "created_at": "2025-06-03T08:36:38.158172+00:00"} {"global_step": 235912, "acc_step": 0, "speed/wps": 5526.468710172724, "speed/FLOPS": 244241629958494.25, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04875250160694122, "optim/lr": 1.0957378316877264e-05, "optim/total_tokens": 1978973290496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2618343830108643, "created_at": "2025-06-03T08:36:41.128027+00:00"} {"global_step": 235913, "acc_step": 0, "speed/wps": 5515.242039033522, "speed/FLOPS": 243745468557453.6, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04655265808105469, "optim/lr": 1.0953831091782718e-05, "optim/total_tokens": 1978981679104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2605011463165283, "created_at": "2025-06-03T08:36:44.109310+00:00"} {"global_step": 235914, "acc_step": 0, "speed/wps": 5508.985973788964, "speed/FLOPS": 243468982495088.84, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04582985118031502, "optim/lr": 1.0950283866688172e-05, "optim/total_tokens": 1978990067712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.247854232788086, "created_at": "2025-06-03T08:36:47.092205+00:00"} {"global_step": 235915, "acc_step": 0, "speed/wps": 5509.310678324097, "speed/FLOPS": 243483332773553.28, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.55 hours", "speed/est_time_elapsed_hrs": 194.72, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.55, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.049780797213315964, "optim/lr": 1.0946736641593624e-05, "optim/total_tokens": 1978998456320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2736518383026123, "created_at": "2025-06-03T08:36:50.076141+00:00"} {"global_step": 235916, "acc_step": 0, "speed/wps": 5520.06927333658, "speed/FLOPS": 243958807605623.78, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047411251813173294, "optim/lr": 1.0943189416499299e-05, "optim/total_tokens": 1979006844928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2736847400665283, "created_at": "2025-06-03T08:36:53.052033+00:00"} {"global_step": 235917, "acc_step": 0, "speed/wps": 5515.874595486378, "speed/FLOPS": 243773424314952.4, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04555793106555939, "optim/lr": 1.0939642191404753e-05, "optim/total_tokens": 1979015233536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.264602780342102, "created_at": "2025-06-03T08:36:56.029837+00:00"} {"global_step": 235918, "acc_step": 0, "speed/wps": 5525.362109805022, "speed/FLOPS": 244192723886335.97, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04712881147861481, "optim/lr": 1.0936094966310206e-05, "optim/total_tokens": 1979023622144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2667080163955688, "created_at": "2025-06-03T08:36:59.003646+00:00"} {"global_step": 235919, "acc_step": 0, "speed/wps": 5518.82336348781, "speed/FLOPS": 243903744767452.8, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04632330313324928, "optim/lr": 1.093254774121566e-05, "optim/total_tokens": 1979032010752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2781256437301636, "created_at": "2025-06-03T08:37:01.980025+00:00"} {"global_step": 235920, "acc_step": 0, "speed/wps": 5519.133929613573, "speed/FLOPS": 243917470200590.03, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04636024683713913, "optim/lr": 1.0929000516121335e-05, "optim/total_tokens": 1979040399360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2546604871749878, "created_at": "2025-06-03T08:37:04.957094+00:00"} {"global_step": 235921, "acc_step": 0, "speed/wps": 5522.896827082551, "speed/FLOPS": 244083771008463.6, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04646332934498787, "optim/lr": 1.0925453291026787e-05, "optim/total_tokens": 1979048787968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2572726011276245, "created_at": "2025-06-03T08:37:07.930349+00:00"} {"global_step": 235922, "acc_step": 0, "speed/wps": 5517.376547247858, "speed/FLOPS": 243839802895123.78, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04765542969107628, "optim/lr": 1.0921906065932241e-05, "optim/total_tokens": 1979057176576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2499723434448242, "created_at": "2025-06-03T08:37:10.904862+00:00"} {"global_step": 235923, "acc_step": 0, "speed/wps": 5514.259035209456, "speed/FLOPS": 243702024819899.56, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04744259640574455, "optim/lr": 1.0918358840837695e-05, "optim/total_tokens": 1979065565184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2592387199401855, "created_at": "2025-06-03T08:37:13.880845+00:00"} {"global_step": 235924, "acc_step": 0, "speed/wps": 5515.919551706556, "speed/FLOPS": 243775411149777.5, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.047615036368370056, "optim/lr": 1.091481161574337e-05, "optim/total_tokens": 1979073953792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2595655918121338, "created_at": "2025-06-03T08:37:16.855836+00:00"} {"global_step": 235925, "acc_step": 0, "speed/wps": 5524.277887618507, "speed/FLOPS": 244144806815244.22, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04624737799167633, "optim/lr": 1.0911264390648824e-05, "optim/total_tokens": 1979082342400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2636998891830444, "created_at": "2025-06-03T08:37:19.829379+00:00"} {"global_step": 235926, "acc_step": 0, "speed/wps": 5514.497207790732, "speed/FLOPS": 243712550828914.2, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04748531058430672, "optim/lr": 1.0907717165554276e-05, "optim/total_tokens": 1979090731008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2711609601974487, "created_at": "2025-06-03T08:37:22.805148+00:00"} {"global_step": 235927, "acc_step": 0, "speed/wps": 5514.322086859338, "speed/FLOPS": 243704811380096.75, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04672724008560181, "optim/lr": 1.090416994045973e-05, "optim/total_tokens": 1979099119616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.275714635848999, "created_at": "2025-06-03T08:37:25.783248+00:00"} {"global_step": 235928, "acc_step": 0, "speed/wps": 5516.246920563226, "speed/FLOPS": 243789879177616.56, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0461624450981617, "optim/lr": 1.0900622715365405e-05, "optim/total_tokens": 1979107508224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2529561519622803, "created_at": "2025-06-03T08:37:28.762385+00:00"} {"global_step": 235929, "acc_step": 0, "speed/wps": 5511.9060894693175, "speed/FLOPS": 243598036661653.5, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04936888813972473, "optim/lr": 1.0897075490270858e-05, "optim/total_tokens": 1979115896832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2660341262817383, "created_at": "2025-06-03T08:37:31.741900+00:00"} {"global_step": 235930, "acc_step": 0, "speed/wps": 5511.224534626772, "speed/FLOPS": 243567915426126.9, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04718171805143356, "optim/lr": 1.0893528265176312e-05, "optim/total_tokens": 1979124285440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.282125473022461, "created_at": "2025-06-03T08:37:34.720275+00:00"} {"global_step": 235931, "acc_step": 0, "speed/wps": 5506.041061476352, "speed/FLOPS": 243338832444299.1, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.54 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.54, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04771167039871216, "optim/lr": 1.0889981040081764e-05, "optim/total_tokens": 1979132674048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2669551372528076, "created_at": "2025-06-03T08:37:37.701422+00:00"} {"global_step": 235932, "acc_step": 0, "speed/wps": 5504.5464892006585, "speed/FLOPS": 243272779999627.8, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046047285199165344, "optim/lr": 1.088643381498744e-05, "optim/total_tokens": 1979141062656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2538502216339111, "created_at": "2025-06-03T08:37:40.686879+00:00"} {"global_step": 235933, "acc_step": 0, "speed/wps": 5519.914084166309, "speed/FLOPS": 243951949038627.97, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04906655102968216, "optim/lr": 1.0882886589892893e-05, "optim/total_tokens": 1979149451264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2516549825668335, "created_at": "2025-06-03T08:37:43.659636+00:00"} {"global_step": 235934, "acc_step": 0, "speed/wps": 5518.987666040994, "speed/FLOPS": 243911006099326.84, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.0553511343896389, "optim/lr": 1.0879339364798347e-05, "optim/total_tokens": 1979157839872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2675437927246094, "created_at": "2025-06-03T08:37:46.635157+00:00"} {"global_step": 235935, "acc_step": 0, "speed/wps": 5521.843661994767, "speed/FLOPS": 244037226502171.16, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.046656783670186996, "optim/lr": 1.0875792139704022e-05, "optim/total_tokens": 1979166228480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2665600776672363, "created_at": "2025-06-03T08:37:49.607451+00:00"} {"global_step": 235936, "acc_step": 0, "speed/wps": 5512.694544124981, "speed/FLOPS": 243632882321757.06, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04686802625656128, "optim/lr": 1.0872244914609474e-05, "optim/total_tokens": 1979174617088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2725168466567993, "created_at": "2025-06-03T08:37:52.586780+00:00"} {"global_step": 235937, "acc_step": 0, "speed/wps": 5517.902085613156, "speed/FLOPS": 243863029000920.75, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048181865364313126, "optim/lr": 1.0868697689514928e-05, "optim/total_tokens": 1979183005696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.269365668296814, "created_at": "2025-06-03T08:37:55.560920+00:00"} {"global_step": 235938, "acc_step": 0, "speed/wps": 5508.8496439191595, "speed/FLOPS": 243462957412643.03, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04667336493730545, "optim/lr": 1.0865150464420381e-05, "optim/total_tokens": 1979191394304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2804592847824097, "created_at": "2025-06-03T08:37:58.539817+00:00"} {"global_step": 235939, "acc_step": 0, "speed/wps": 5510.354686616955, "speed/FLOPS": 243529472596378.75, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048176053911447525, "optim/lr": 1.0861603239326057e-05, "optim/total_tokens": 1979199782912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2785471677780151, "created_at": "2025-06-03T08:38:01.517643+00:00"} {"global_step": 235940, "acc_step": 0, "speed/wps": 5500.782423786949, "speed/FLOPS": 243106427574575.16, "speed/curr_iter_time": 2.9777, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9777, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04764244332909584, "optim/lr": 1.085805601423151e-05, "optim/total_tokens": 1979208171520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2649980783462524, "created_at": "2025-06-03T08:38:04.503255+00:00"} {"global_step": 235941, "acc_step": 0, "speed/wps": 5516.552690869094, "speed/FLOPS": 243803392660061.62, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04678552597761154, "optim/lr": 1.0854508789136964e-05, "optim/total_tokens": 1979216560128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2617928981781006, "created_at": "2025-06-03T08:38:07.482347+00:00"} {"global_step": 235942, "acc_step": 0, "speed/wps": 5498.881621737523, "speed/FLOPS": 243022421853177.4, "speed/curr_iter_time": 2.9769, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9769, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.048282440751791, "optim/lr": 1.0850961564042416e-05, "optim/total_tokens": 1979224948736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2472766637802124, "created_at": "2025-06-03T08:38:10.470207+00:00"} {"global_step": 235943, "acc_step": 0, "speed/wps": 5524.965678140062, "speed/FLOPS": 244175203635865.94, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0465245321393013, "optim/lr": 1.0847414338948091e-05, "optim/total_tokens": 1979233337344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.246254801750183, "created_at": "2025-06-03T08:38:13.440922+00:00"} {"global_step": 235944, "acc_step": 0, "speed/wps": 5521.806088664873, "speed/FLOPS": 244035565953307.56, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046699050813913345, "optim/lr": 1.0843867113853545e-05, "optim/total_tokens": 1979241725952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2866626977920532, "created_at": "2025-06-03T08:38:16.411988+00:00"} {"global_step": 235945, "acc_step": 0, "speed/wps": 5506.141249944111, "speed/FLOPS": 243343260261762.97, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04817633330821991, "optim/lr": 1.0840319888758999e-05, "optim/total_tokens": 1979250114560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2665371894836426, "created_at": "2025-06-03T08:38:19.396827+00:00"} {"global_step": 235946, "acc_step": 0, "speed/wps": 5515.496809647408, "speed/FLOPS": 243756728114553.12, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04610102251172066, "optim/lr": 1.0836772663664452e-05, "optim/total_tokens": 1979258503168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2436943054199219, "created_at": "2025-06-03T08:38:22.374168+00:00"} {"global_step": 235947, "acc_step": 0, "speed/wps": 5525.095597779544, "speed/FLOPS": 244180945418942.03, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05126061290502548, "optim/lr": 1.0833225438570126e-05, "optim/total_tokens": 1979266891776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2491408586502075, "created_at": "2025-06-03T08:38:25.343829+00:00"} {"global_step": 235948, "acc_step": 0, "speed/wps": 5512.981147694078, "speed/FLOPS": 243645548732541.1, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04773465916514397, "optim/lr": 1.082967821347558e-05, "optim/total_tokens": 1979275280384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2545725107192993, "created_at": "2025-06-03T08:38:28.319700+00:00"} {"global_step": 235949, "acc_step": 0, "speed/wps": 5516.787507290289, "speed/FLOPS": 243813770343979.06, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047466106712818146, "optim/lr": 1.0826130988381033e-05, "optim/total_tokens": 1979283668992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2691246271133423, "created_at": "2025-06-03T08:38:31.298517+00:00"} {"global_step": 235950, "acc_step": 0, "speed/wps": 5521.596959087335, "speed/FLOPS": 244026323496402.6, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.055759262293577194, "optim/lr": 1.0822583763286487e-05, "optim/total_tokens": 1979292057600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.265366792678833, "created_at": "2025-06-03T08:38:34.272426+00:00"} {"global_step": 235951, "acc_step": 0, "speed/wps": 5512.7686112715755, "speed/FLOPS": 243636155710526.5, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04679900407791138, "optim/lr": 1.0819036538192162e-05, "optim/total_tokens": 1979300446208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2703773975372314, "created_at": "2025-06-03T08:38:37.249113+00:00"} {"global_step": 235952, "acc_step": 0, "speed/wps": 5513.122292138435, "speed/FLOPS": 243651786594538.94, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05241215601563454, "optim/lr": 1.0815489313097614e-05, "optim/total_tokens": 1979308834816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2706053256988525, "created_at": "2025-06-03T08:38:40.227576+00:00"} {"global_step": 235953, "acc_step": 0, "speed/wps": 5509.033655687266, "speed/FLOPS": 243471089790935.75, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.52 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.52, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048205263912677765, "optim/lr": 1.0811942088003068e-05, "optim/total_tokens": 1979317223424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2654781341552734, "created_at": "2025-06-03T08:38:43.206039+00:00"} {"global_step": 235954, "acc_step": 0, "speed/wps": 5521.253871050046, "speed/FLOPS": 244011160761238.2, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04878590628504753, "optim/lr": 1.0808394862908522e-05, "optim/total_tokens": 1979325612032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2643373012542725, "created_at": "2025-06-03T08:38:46.180070+00:00"} {"global_step": 235955, "acc_step": 0, "speed/wps": 5509.239020274151, "speed/FLOPS": 243480165854524.78, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049606408923864365, "optim/lr": 1.0804847637814197e-05, "optim/total_tokens": 1979334000640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.255983591079712, "created_at": "2025-06-03T08:38:49.158320+00:00"} {"global_step": 235956, "acc_step": 0, "speed/wps": 5525.72348580399, "speed/FLOPS": 244208694855800.3, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04622480273246765, "optim/lr": 1.080130041271965e-05, "optim/total_tokens": 1979342389248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2725880146026611, "created_at": "2025-06-03T08:38:52.129469+00:00"} {"global_step": 235957, "acc_step": 0, "speed/wps": 5508.685814626468, "speed/FLOPS": 243455716996460.4, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049618352204561234, "optim/lr": 1.0797753187625103e-05, "optim/total_tokens": 1979350777856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.258533239364624, "created_at": "2025-06-03T08:38:55.107617+00:00"} {"global_step": 235958, "acc_step": 0, "speed/wps": 5529.386574014388, "speed/FLOPS": 244370584605314.78, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.15, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0467451810836792, "optim/lr": 1.0794205962530556e-05, "optim/total_tokens": 1979359166464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2566925287246704, "created_at": "2025-06-03T08:38:58.075576+00:00"} {"global_step": 235959, "acc_step": 0, "speed/wps": 5524.980640459482, "speed/FLOPS": 244175864893800.22, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047249242663383484, "optim/lr": 1.0790658737436232e-05, "optim/total_tokens": 1979367555072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2636486291885376, "created_at": "2025-06-03T08:39:01.049526+00:00"} {"global_step": 235960, "acc_step": 0, "speed/wps": 5511.738319820396, "speed/FLOPS": 243590622101894.1, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04658390209078789, "optim/lr": 1.0787111512341685e-05, "optim/total_tokens": 1979375943680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2582173347473145, "created_at": "2025-06-03T08:39:04.031709+00:00"} {"global_step": 235961, "acc_step": 0, "speed/wps": 5523.712776468357, "speed/FLOPS": 244119831794908.7, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046713754534721375, "optim/lr": 1.0783564287247139e-05, "optim/total_tokens": 1979384332288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.269484043121338, "created_at": "2025-06-03T08:39:07.004470+00:00"} {"global_step": 235962, "acc_step": 0, "speed/wps": 5518.622490264164, "speed/FLOPS": 243894867199130.06, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04745567962527275, "optim/lr": 1.0780017062152814e-05, "optim/total_tokens": 1979392720896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2620902061462402, "created_at": "2025-06-03T08:39:09.979901+00:00"} {"global_step": 235963, "acc_step": 0, "speed/wps": 5528.329632725363, "speed/FLOPS": 244323873210255.8, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046361830085515976, "optim/lr": 1.0776469837058266e-05, "optim/total_tokens": 1979401109504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2583599090576172, "created_at": "2025-06-03T08:39:12.952009+00:00"} {"global_step": 235964, "acc_step": 0, "speed/wps": 5508.138216380293, "speed/FLOPS": 243431515956841.38, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04723753780126572, "optim/lr": 1.077292261196372e-05, "optim/total_tokens": 1979409498112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2690962553024292, "created_at": "2025-06-03T08:39:15.937240+00:00"} {"global_step": 235965, "acc_step": 0, "speed/wps": 5502.641701108728, "speed/FLOPS": 243188598115553.75, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04772300273180008, "optim/lr": 1.0769375386869174e-05, "optim/total_tokens": 1979417886720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2534464597702026, "created_at": "2025-06-03T08:39:18.918791+00:00"} {"global_step": 235966, "acc_step": 0, "speed/wps": 5508.899822238808, "speed/FLOPS": 243465175037535.6, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.51 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.51, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046759188175201416, "optim/lr": 1.0765828161774849e-05, "optim/total_tokens": 1979426275328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2896623611450195, "created_at": "2025-06-03T08:39:21.899583+00:00"} {"global_step": 235967, "acc_step": 0, "speed/wps": 5511.644830880572, "speed/FLOPS": 243586490369273.62, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04682532325387001, "optim/lr": 1.0762280936680303e-05, "optim/total_tokens": 1979434663936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2786740064620972, "created_at": "2025-06-03T08:39:24.881377+00:00"} {"global_step": 235968, "acc_step": 0, "speed/wps": 5524.841746731137, "speed/FLOPS": 244169726501929.94, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0468730665743351, "optim/lr": 1.0758733711585755e-05, "optim/total_tokens": 1979443052544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2679132223129272, "created_at": "2025-06-03T08:39:27.852593+00:00"} {"global_step": 235969, "acc_step": 0, "speed/wps": 5519.814373698207, "speed/FLOPS": 243947542346302.3, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05089096352458, "optim/lr": 1.0755186486491208e-05, "optim/total_tokens": 1979451441152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2638064622879028, "created_at": "2025-06-03T08:39:30.826572+00:00"} {"global_step": 235970, "acc_step": 0, "speed/wps": 5520.3381930945025, "speed/FLOPS": 243970692482467.84, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04714730754494667, "optim/lr": 1.0751639261396884e-05, "optim/total_tokens": 1979459829760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2691794633865356, "created_at": "2025-06-03T08:39:33.801482+00:00"} {"global_step": 235971, "acc_step": 0, "speed/wps": 5516.616918132723, "speed/FLOPS": 243806231176369.12, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049715425819158554, "optim/lr": 1.0748092036302337e-05, "optim/total_tokens": 1979468218368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2579519748687744, "created_at": "2025-06-03T08:39:36.778779+00:00"} {"global_step": 235972, "acc_step": 0, "speed/wps": 5518.27885477982, "speed/FLOPS": 243879680269607.9, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04645995423197746, "optim/lr": 1.0744544811207791e-05, "optim/total_tokens": 1979476606976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2565977573394775, "created_at": "2025-06-03T08:39:39.754368+00:00"} {"global_step": 235973, "acc_step": 0, "speed/wps": 5520.555863716526, "speed/FLOPS": 243980312409822.03, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04818244278430939, "optim/lr": 1.0740997586113243e-05, "optim/total_tokens": 1979484995584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2610644102096558, "created_at": "2025-06-03T08:39:42.726866+00:00"} {"global_step": 235974, "acc_step": 0, "speed/wps": 5506.215409086437, "speed/FLOPS": 243346537716272.84, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048012424260377884, "optim/lr": 1.0737450361018918e-05, "optim/total_tokens": 1979493384192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2754111289978027, "created_at": "2025-06-03T08:39:45.709775+00:00"} {"global_step": 235975, "acc_step": 0, "speed/wps": 5500.367230138956, "speed/FLOPS": 243088078140487.62, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.5 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.5, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0464448519051075, "optim/lr": 1.0733903135924372e-05, "optim/total_tokens": 1979501772800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2553191184997559, "created_at": "2025-06-03T08:39:48.695862+00:00"} {"global_step": 235976, "acc_step": 0, "speed/wps": 5525.3301940945275, "speed/FLOPS": 244191313375291.53, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050570305436849594, "optim/lr": 1.0730355910829826e-05, "optim/total_tokens": 1979510161408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2709639072418213, "created_at": "2025-06-03T08:39:51.671335+00:00"} {"global_step": 235977, "acc_step": 0, "speed/wps": 5527.808178642271, "speed/FLOPS": 244300827608827.1, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.21, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04788442328572273, "optim/lr": 1.072680868573528e-05, "optim/total_tokens": 1979518550016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2584134340286255, "created_at": "2025-06-03T08:39:54.640799+00:00"} {"global_step": 235978, "acc_step": 0, "speed/wps": 5522.4604819168935, "speed/FLOPS": 244064486785558.6, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048867300152778625, "optim/lr": 1.0723261460640955e-05, "optim/total_tokens": 1979526938624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2606911659240723, "created_at": "2025-06-03T08:39:57.615974+00:00"} {"global_step": 235979, "acc_step": 0, "speed/wps": 5510.127423563811, "speed/FLOPS": 243519428732667.53, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05084269866347313, "optim/lr": 1.0719714235546407e-05, "optim/total_tokens": 1979535327232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2642061710357666, "created_at": "2025-06-03T08:40:00.596365+00:00"} {"global_step": 235980, "acc_step": 0, "speed/wps": 5534.0997798380995, "speed/FLOPS": 244578884178348.5, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04699092358350754, "optim/lr": 1.071616701045186e-05, "optim/total_tokens": 1979543715840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2556720972061157, "created_at": "2025-06-03T08:40:03.562436+00:00"} {"global_step": 235981, "acc_step": 0, "speed/wps": 5507.5550556707, "speed/FLOPS": 243405743238364.5, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050155408680438995, "optim/lr": 1.0712619785357314e-05, "optim/total_tokens": 1979552104448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2488352060317993, "created_at": "2025-06-03T08:40:06.542814+00:00"} {"global_step": 235982, "acc_step": 0, "speed/wps": 5520.116179900981, "speed/FLOPS": 243960880635680.7, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04837913438677788, "optim/lr": 1.070907256026299e-05, "optim/total_tokens": 1979560493056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2674938440322876, "created_at": "2025-06-03T08:40:09.518637+00:00"} {"global_step": 235983, "acc_step": 0, "speed/wps": 5508.649665112646, "speed/FLOPS": 243454119372979.47, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04834112897515297, "optim/lr": 1.0705525335168443e-05, "optim/total_tokens": 1979568881664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2623642683029175, "created_at": "2025-06-03T08:40:12.500469+00:00"} {"global_step": 235984, "acc_step": 0, "speed/wps": 5506.476260917119, "speed/FLOPS": 243358066032028.3, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05134330317378044, "optim/lr": 1.0701978110073895e-05, "optim/total_tokens": 1979577270272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2814197540283203, "created_at": "2025-06-03T08:40:15.482182+00:00"} {"global_step": 235985, "acc_step": 0, "speed/wps": 5518.157799162091, "speed/FLOPS": 243874330230923.06, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.46, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047400254756212234, "optim/lr": 1.0698430884979349e-05, "optim/total_tokens": 1979585658880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2621861696243286, "created_at": "2025-06-03T08:40:18.460658+00:00"} {"global_step": 235986, "acc_step": 0, "speed/wps": 5505.5720934918145, "speed/FLOPS": 243318106459778.25, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05697103589773178, "optim/lr": 1.0694883659885024e-05, "optim/total_tokens": 1979594047488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2590526342391968, "created_at": "2025-06-03T08:40:21.445346+00:00"} {"global_step": 235987, "acc_step": 0, "speed/wps": 5517.774118744024, "speed/FLOPS": 243857373520298.94, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04860083758831024, "optim/lr": 1.0691336434790478e-05, "optim/total_tokens": 1979602436096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2592145204544067, "created_at": "2025-06-03T08:40:24.419674+00:00"} {"global_step": 235988, "acc_step": 0, "speed/wps": 5512.358691046942, "speed/FLOPS": 243618039334759.62, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048926953226327896, "optim/lr": 1.0687789209695931e-05, "optim/total_tokens": 1979610824704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2678309679031372, "created_at": "2025-06-03T08:40:27.396244+00:00"} {"global_step": 235989, "acc_step": 0, "speed/wps": 5498.635340444752, "speed/FLOPS": 243011537480618.84, "speed/curr_iter_time": 2.9773, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9773, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05241766571998596, "optim/lr": 1.0684241984601605e-05, "optim/total_tokens": 1979619213312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2661263942718506, "created_at": "2025-06-03T08:40:30.384177+00:00"} {"global_step": 235990, "acc_step": 0, "speed/wps": 5511.447707466254, "speed/FLOPS": 243577778523329.88, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04633723199367523, "optim/lr": 1.0680694759507059e-05, "optim/total_tokens": 1979627601920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2565171718597412, "created_at": "2025-06-03T08:40:33.361182+00:00"} {"global_step": 235991, "acc_step": 0, "speed/wps": 5507.871149110403, "speed/FLOPS": 243419712950486.47, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.49 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.49, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04908721148967743, "optim/lr": 1.0677147534412512e-05, "optim/total_tokens": 1979635990528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2690112590789795, "created_at": "2025-06-03T08:40:36.340051+00:00"} {"global_step": 235992, "acc_step": 0, "speed/wps": 5514.6356008944895, "speed/FLOPS": 243718667095740.12, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048127010464668274, "optim/lr": 1.0673600309317966e-05, "optim/total_tokens": 1979644379136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.273787021636963, "created_at": "2025-06-03T08:40:39.315507+00:00"} {"global_step": 235993, "acc_step": 0, "speed/wps": 5515.814472545987, "speed/FLOPS": 243770767188724.22, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046856168657541275, "optim/lr": 1.0670053084223641e-05, "optim/total_tokens": 1979652767744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.264913558959961, "created_at": "2025-06-03T08:40:42.290008+00:00"} {"global_step": 235994, "acc_step": 0, "speed/wps": 5520.492480171529, "speed/FLOPS": 243977511181559.53, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04857279360294342, "optim/lr": 1.0666505859129093e-05, "optim/total_tokens": 1979661156352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.266871452331543, "created_at": "2025-06-03T08:40:45.262733+00:00"} {"global_step": 235995, "acc_step": 0, "speed/wps": 5524.388582788414, "speed/FLOPS": 244149698975164.9, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.47 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.47, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048224639147520065, "optim/lr": 1.0662958634034547e-05, "optim/total_tokens": 1979669544960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2708457708358765, "created_at": "2025-06-03T08:40:48.237034+00:00"} {"global_step": 235996, "acc_step": 0, "speed/wps": 5500.039200977583, "speed/FLOPS": 243073580930560.38, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04809293895959854, "optim/lr": 1.065941140894e-05, "optim/total_tokens": 1979677933568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.273105263710022, "created_at": "2025-06-03T08:40:51.224538+00:00"} {"global_step": 235997, "acc_step": 0, "speed/wps": 5501.239046721709, "speed/FLOPS": 243126607971083.5, "speed/curr_iter_time": 2.9773, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9773, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05096202716231346, "optim/lr": 1.0655864183845676e-05, "optim/total_tokens": 1979686322176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2740343809127808, "created_at": "2025-06-03T08:40:54.210936+00:00"} {"global_step": 235998, "acc_step": 0, "speed/wps": 5389.005188198619, "speed/FLOPS": 238166445889327.38, "speed/curr_iter_time": 3.0393, "speed/data_load_time": 0.0006, "speed/curr_step_time": 3.0393, "speed/est_time_elapsed": "8.3 days", "speed/est_time_remaining": "2.53 hours", "speed/est_time_elapsed_hrs": 199.24, "speed/est_time_elapsed_days": 8.3, "speed/est_time_remaining_hrs": 2.53, "speed/est_time_remaining_days": 0.11, "optim/grad_norm": 0.04602833464741707, "optim/lr": 1.065231695875113e-05, "optim/total_tokens": 1979694710784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2628499269485474, "created_at": "2025-06-03T08:40:57.260551+00:00"} {"global_step": 235999, "acc_step": 0, "speed/wps": 5512.473310698631, "speed/FLOPS": 243623104936687.75, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04806704819202423, "optim/lr": 1.0648769733656583e-05, "optim/total_tokens": 1979703099392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2642285823822021, "created_at": "2025-06-03T08:41:00.238647+00:00"} {"global_step": 236000, "acc_step": 0, "speed/wps": 5512.238104450595, "speed/FLOPS": 243612710024419.22, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.48 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.48, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04628809913992882, "optim/lr": 1.0645222508562035e-05, "optim/total_tokens": 1979711488000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2580705881118774, "created_at": "2025-06-03T08:41:03.216172+00:00"} {"global_step": 236001, "acc_step": 0, "speed/wps": 224.70631420876103, "speed/FLOPS": 9930868936847.387, "speed/curr_iter_time": 5.8269, "speed/data_load_time": 3.7738, "speed/curr_step_time": 5.8269, "speed/est_time_elapsed": "15.92 days", "speed/est_time_remaining": "4.85 hours", "speed/est_time_elapsed_hrs": 381.99, "speed/est_time_elapsed_days": 15.92, "speed/est_time_remaining_hrs": 4.85, "speed/est_time_remaining_days": 0.2, "optim/grad_norm": 0.04759779945015907, "optim/lr": 1.064167528346771e-05, "optim/total_tokens": 1979719876608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.274269461631775, "created_at": "2025-06-03T08:42:16.136598+00:00"} {"global_step": 236002, "acc_step": 0, "speed/wps": 5616.274097881125, "speed/FLOPS": 248210568429561.6, "speed/curr_iter_time": 2.9141, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9141, "speed/est_time_elapsed": "7.96 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 191.04, "speed/est_time_elapsed_days": 7.96, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046633001416921616, "optim/lr": 1.0638128058373164e-05, "optim/total_tokens": 1979728265216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2661057710647583, "created_at": "2025-06-03T08:42:19.061062+00:00"} {"global_step": 236003, "acc_step": 0, "speed/wps": 5600.216541777042, "speed/FLOPS": 247500906639783.97, "speed/curr_iter_time": 2.9243, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9243, "speed/est_time_elapsed": "7.99 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 191.71, "speed/est_time_elapsed_days": 7.99, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046982210129499435, "optim/lr": 1.0634580833278618e-05, "optim/total_tokens": 1979736653824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2792658805847168, "created_at": "2025-06-03T08:42:21.993611+00:00"} {"global_step": 236004, "acc_step": 0, "speed/wps": 5589.679471071364, "speed/FLOPS": 247035222048210.06, "speed/curr_iter_time": 2.9299, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9299, "speed/est_time_elapsed": "8.0 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 192.07, "speed/est_time_elapsed_days": 8.0, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049076810479164124, "optim/lr": 1.0631033608184072e-05, "optim/total_tokens": 1979745042432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.266715407371521, "created_at": "2025-06-03T08:42:24.931367+00:00"} {"global_step": 236005, "acc_step": 0, "speed/wps": 5546.289529437335, "speed/FLOPS": 245117608717840.2, "speed/curr_iter_time": 2.9529, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9529, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 193.58, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05085310339927673, "optim/lr": 1.0627486383089745e-05, "optim/total_tokens": 1979753431040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2668248414993286, "created_at": "2025-06-03T08:42:27.892076+00:00"} {"global_step": 236006, "acc_step": 0, "speed/wps": 5562.434099747589, "speed/FLOPS": 245831116090151.5, "speed/curr_iter_time": 2.943, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.943, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 192.93, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04581589251756668, "optim/lr": 1.0623939157995199e-05, "optim/total_tokens": 1979761819648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.270243763923645, "created_at": "2025-06-03T08:42:30.841255+00:00"} {"global_step": 236007, "acc_step": 0, "speed/wps": 5538.677540566677, "speed/FLOPS": 244781197771448.12, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 193.85, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04965298995375633, "optim/lr": 1.0620391932900653e-05, "optim/total_tokens": 1979770208256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2645303010940552, "created_at": "2025-06-03T08:42:33.809396+00:00"} {"global_step": 236008, "acc_step": 0, "speed/wps": 5536.281302484642, "speed/FLOPS": 244675296313280.53, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04816566780209541, "optim/lr": 1.0616844707806106e-05, "optim/total_tokens": 1979778596864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.288038730621338, "created_at": "2025-06-03T08:42:36.775670+00:00"} {"global_step": 236009, "acc_step": 0, "speed/wps": 5528.8892701935565, "speed/FLOPS": 244348606321865.72, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047259870916604996, "optim/lr": 1.0613297482711782e-05, "optim/total_tokens": 1979786985472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2650071382522583, "created_at": "2025-06-03T08:42:39.747907+00:00"} {"global_step": 236010, "acc_step": 0, "speed/wps": 5528.301552891364, "speed/FLOPS": 244322632225318.66, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05388392135500908, "optim/lr": 1.0609750257617234e-05, "optim/total_tokens": 1979795374080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2565510272979736, "created_at": "2025-06-03T08:42:42.717351+00:00"} {"global_step": 236011, "acc_step": 0, "speed/wps": 5547.331932184403, "speed/FLOPS": 245163677583759.66, "speed/curr_iter_time": 2.9525, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9525, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 193.56, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04902853071689606, "optim/lr": 1.0606203032522687e-05, "optim/total_tokens": 1979803762688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2537494897842407, "created_at": "2025-06-03T08:42:45.676282+00:00"} {"global_step": 236012, "acc_step": 0, "speed/wps": 5547.048642079735, "speed/FLOPS": 245151157611143.56, "speed/curr_iter_time": 2.9511, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9511, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 193.47, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04891190677881241, "optim/lr": 1.0602655807428141e-05, "optim/total_tokens": 1979812151296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2636555433273315, "created_at": "2025-06-03T08:42:48.637842+00:00"} {"global_step": 236013, "acc_step": 0, "speed/wps": 5534.912395646078, "speed/FLOPS": 244614797637716.38, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05125746503472328, "optim/lr": 1.0599108582333816e-05, "optim/total_tokens": 1979820539904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2751963138580322, "created_at": "2025-06-03T08:42:51.606666+00:00"} {"global_step": 236014, "acc_step": 0, "speed/wps": 5523.764520220784, "speed/FLOPS": 244122118603917.44, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046472348272800446, "optim/lr": 1.059556135723927e-05, "optim/total_tokens": 1979828928512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.266541600227356, "created_at": "2025-06-03T08:42:54.580553+00:00"} {"global_step": 236015, "acc_step": 0, "speed/wps": 5525.978247597697, "speed/FLOPS": 244219954023093.1, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050999946892261505, "optim/lr": 1.0592014132144722e-05, "optim/total_tokens": 1979837317120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.263723611831665, "created_at": "2025-06-03T08:42:57.550040+00:00"} {"global_step": 236016, "acc_step": 0, "speed/wps": 5518.429889655484, "speed/FLOPS": 243886355238045.66, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04673544317483902, "optim/lr": 1.0588466907050397e-05, "optim/total_tokens": 1979845705728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2708842754364014, "created_at": "2025-06-03T08:43:00.525566+00:00"} {"global_step": 236017, "acc_step": 0, "speed/wps": 5527.09639764165, "speed/FLOPS": 244269370531825.06, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.46 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.46, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04737601429224014, "optim/lr": 1.0584919681955851e-05, "optim/total_tokens": 1979854094336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2823327779769897, "created_at": "2025-06-03T08:43:03.494338+00:00"} {"global_step": 236018, "acc_step": 0, "speed/wps": 5532.3584351474665, "speed/FLOPS": 244501925656032.62, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04668043553829193, "optim/lr": 1.0581372456861305e-05, "optim/total_tokens": 1979862482944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2576944828033447, "created_at": "2025-06-03T08:43:06.463572+00:00"} {"global_step": 236019, "acc_step": 0, "speed/wps": 5541.959251306172, "speed/FLOPS": 244926232588815.5, "speed/curr_iter_time": 2.9537, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9537, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049777548760175705, "optim/lr": 1.0577825231766758e-05, "optim/total_tokens": 1979870871552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2911946773529053, "created_at": "2025-06-03T08:43:09.424559+00:00"} {"global_step": 236020, "acc_step": 0, "speed/wps": 5545.161998236247, "speed/FLOPS": 245067777609980.0, "speed/curr_iter_time": 2.9537, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9537, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 193.65, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04795972257852554, "optim/lr": 1.0574278006672434e-05, "optim/total_tokens": 1979879260160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2690601348876953, "created_at": "2025-06-03T08:43:12.387004+00:00"} {"global_step": 236021, "acc_step": 0, "speed/wps": 5541.666348564905, "speed/FLOPS": 244913287786863.66, "speed/curr_iter_time": 2.9556, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9556, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 193.77, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04890572652220726, "optim/lr": 1.0570730781577886e-05, "optim/total_tokens": 1979887648768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2748483419418335, "created_at": "2025-06-03T08:43:15.352507+00:00"} {"global_step": 236022, "acc_step": 0, "speed/wps": 5532.269324592238, "speed/FLOPS": 244497987425600.7, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04718824103474617, "optim/lr": 1.056718355648334e-05, "optim/total_tokens": 1979896037376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.272750735282898, "created_at": "2025-06-03T08:43:18.320839+00:00"} {"global_step": 236023, "acc_step": 0, "speed/wps": 5532.221016943703, "speed/FLOPS": 244495852474796.4, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.01, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04786711931228638, "optim/lr": 1.0563636331388793e-05, "optim/total_tokens": 1979904425984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.267632246017456, "created_at": "2025-06-03T08:43:21.287816+00:00"} {"global_step": 236024, "acc_step": 0, "speed/wps": 5530.50560668277, "speed/FLOPS": 244420040121528.84, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047503914684057236, "optim/lr": 1.0560089106294468e-05, "optim/total_tokens": 1979912814592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.26866614818573, "created_at": "2025-06-03T08:43:24.257993+00:00"} {"global_step": 236025, "acc_step": 0, "speed/wps": 5523.398463628931, "speed/FLOPS": 244105940776205.0, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04691760241985321, "optim/lr": 1.0556541881199922e-05, "optim/total_tokens": 1979921203200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2658939361572266, "created_at": "2025-06-03T08:43:27.232400+00:00"} {"global_step": 236026, "acc_step": 0, "speed/wps": 5517.249433574282, "speed/FLOPS": 243834185121378.5, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04720139503479004, "optim/lr": 1.0552994656105374e-05, "optim/total_tokens": 1979929591808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2571828365325928, "created_at": "2025-06-03T08:43:30.206130+00:00"} {"global_step": 236027, "acc_step": 0, "speed/wps": 5543.1735235544165, "speed/FLOPS": 244979897206979.16, "speed/curr_iter_time": 2.9547, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9547, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 193.72, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04897686839103699, "optim/lr": 1.0549447431010828e-05, "optim/total_tokens": 1979937980416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2594854831695557, "created_at": "2025-06-03T08:43:33.167533+00:00"} {"global_step": 236028, "acc_step": 0, "speed/wps": 5536.424007561264, "speed/FLOPS": 244681603147236.44, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 193.96, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04682674631476402, "optim/lr": 1.0545900205916503e-05, "optim/total_tokens": 1979946369024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2559714317321777, "created_at": "2025-06-03T08:43:36.135304+00:00"} {"global_step": 236029, "acc_step": 0, "speed/wps": 5531.266167533341, "speed/FLOPS": 244453653018220.75, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.05, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05288058891892433, "optim/lr": 1.0542352980821957e-05, "optim/total_tokens": 1979954757632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2542834281921387, "created_at": "2025-06-03T08:43:39.101609+00:00"} {"global_step": 236030, "acc_step": 0, "speed/wps": 5519.059063242098, "speed/FLOPS": 243914161490171.66, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.57, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04636969417333603, "optim/lr": 1.053880575572741e-05, "optim/total_tokens": 1979963146240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2616251707077026, "created_at": "2025-06-03T08:43:42.074799+00:00"} {"global_step": 236031, "acc_step": 0, "speed/wps": 5526.088232386875, "speed/FLOPS": 244224814787821.56, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.33, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.051501352339982986, "optim/lr": 1.0535258530632862e-05, "optim/total_tokens": 1979971534848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2679167985916138, "created_at": "2025-06-03T08:43:45.043982+00:00"} {"global_step": 236032, "acc_step": 0, "speed/wps": 5552.251008630809, "speed/FLOPS": 245381075584575.12, "speed/curr_iter_time": 2.9499, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9499, "speed/est_time_elapsed": "8.06 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 193.41, "speed/est_time_elapsed_days": 8.06, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04810767248272896, "optim/lr": 1.0531711305538538e-05, "optim/total_tokens": 1979979923456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2708464860916138, "created_at": "2025-06-03T08:43:48.003029+00:00"} {"global_step": 236033, "acc_step": 0, "speed/wps": 5514.951652694334, "speed/FLOPS": 243732634967593.53, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0466172955930233, "optim/lr": 1.0528164080443991e-05, "optim/total_tokens": 1979988312064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2857097387313843, "created_at": "2025-06-03T08:43:50.978020+00:00"} {"global_step": 236034, "acc_step": 0, "speed/wps": 5518.615796242228, "speed/FLOPS": 243894571357623.56, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.45 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.45, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05280103161931038, "optim/lr": 1.0524616855349445e-05, "optim/total_tokens": 1979996700672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.262762188911438, "created_at": "2025-06-03T08:43:53.956135+00:00"} {"global_step": 236035, "acc_step": 0, "speed/wps": 5524.303445041029, "speed/FLOPS": 244145936322504.94, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046526502817869186, "optim/lr": 1.0521069630254899e-05, "optim/total_tokens": 1980005089280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.257885456085205, "created_at": "2025-06-03T08:43:56.929946+00:00"} {"global_step": 236036, "acc_step": 0, "speed/wps": 5532.470768434074, "speed/FLOPS": 244506890212326.78, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.0, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04761475697159767, "optim/lr": 1.0517522405160574e-05, "optim/total_tokens": 1980013477888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2638808488845825, "created_at": "2025-06-03T08:43:59.900592+00:00"} {"global_step": 236037, "acc_step": 0, "speed/wps": 5533.568032144089, "speed/FLOPS": 244555383652004.62, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04735356941819191, "optim/lr": 1.0513975180066026e-05, "optim/total_tokens": 1980021866496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2715774774551392, "created_at": "2025-06-03T08:44:02.868448+00:00"} {"global_step": 236038, "acc_step": 0, "speed/wps": 5538.4797595177415, "speed/FLOPS": 244772456861420.34, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046129144728183746, "optim/lr": 1.051042795497148e-05, "optim/total_tokens": 1980030255104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2616032361984253, "created_at": "2025-06-03T08:44:05.835520+00:00"} {"global_step": 236039, "acc_step": 0, "speed/wps": 5533.272009766767, "speed/FLOPS": 244542300978106.9, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 193.99, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047040484845638275, "optim/lr": 1.0506880729876933e-05, "optim/total_tokens": 1980038643712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.267579197883606, "created_at": "2025-06-03T08:44:08.800516+00:00"} {"global_step": 236040, "acc_step": 0, "speed/wps": 5538.667869564955, "speed/FLOPS": 244780770362672.7, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 193.89, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04857505485415459, "optim/lr": 1.0503333504782609e-05, "optim/total_tokens": 1980047032320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.2693374156951904, "created_at": "2025-06-03T08:44:11.763056+00:00"} {"global_step": 236041, "acc_step": 0, "speed/wps": 5524.600971725047, "speed/FLOPS": 244159085479058.94, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.39, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046945661306381226, "optim/lr": 1.0499786279688062e-05, "optim/total_tokens": 1980055420928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.278887152671814, "created_at": "2025-06-03T08:44:14.734324+00:00"} {"global_step": 236042, "acc_step": 0, "speed/wps": 5512.364048980768, "speed/FLOPS": 243618276128010.3, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04948163777589798, "optim/lr": 1.0496239054593514e-05, "optim/total_tokens": 1980063809536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2842499017715454, "created_at": "2025-06-03T08:44:17.710557+00:00"} {"global_step": 236043, "acc_step": 0, "speed/wps": 5506.031227092529, "speed/FLOPS": 243338397814871.03, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.44 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.44, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047566089779138565, "optim/lr": 1.0492691829498968e-05, "optim/total_tokens": 1980072198144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.278684139251709, "created_at": "2025-06-03T08:44:20.692897+00:00"} {"global_step": 236044, "acc_step": 0, "speed/wps": 5532.653261845515, "speed/FLOPS": 244514955487026.53, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048821475356817245, "optim/lr": 1.0489144604404643e-05, "optim/total_tokens": 1980080586752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2719292640686035, "created_at": "2025-06-03T08:44:23.662202+00:00"} {"global_step": 236045, "acc_step": 0, "speed/wps": 5544.475095560076, "speed/FLOPS": 245037420027579.8, "speed/curr_iter_time": 2.954, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.954, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 193.69, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04629262909293175, "optim/lr": 1.0485597379310097e-05, "optim/total_tokens": 1980088975360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2739908695220947, "created_at": "2025-06-03T08:44:26.625626+00:00"} {"global_step": 236046, "acc_step": 0, "speed/wps": 5533.517035747064, "speed/FLOPS": 244553129872279.38, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 193.98, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049371138215065, "optim/lr": 1.048205015421555e-05, "optim/total_tokens": 1980097363968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2725579738616943, "created_at": "2025-06-03T08:44:29.590655+00:00"} {"global_step": 236047, "acc_step": 0, "speed/wps": 5527.422199918999, "speed/FLOPS": 244283769324876.66, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04809324070811272, "optim/lr": 1.0478502929121224e-05, "optim/total_tokens": 1980105752576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2720357179641724, "created_at": "2025-06-03T08:44:32.559097+00:00"} {"global_step": 236048, "acc_step": 0, "speed/wps": 5518.81165557348, "speed/FLOPS": 243903227337565.97, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05009343475103378, "optim/lr": 1.0474955704026678e-05, "optim/total_tokens": 1980114141184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2650072574615479, "created_at": "2025-06-03T08:44:35.536243+00:00"} {"global_step": 236049, "acc_step": 0, "speed/wps": 5515.529956340366, "speed/FLOPS": 243758193028721.72, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04737817496061325, "optim/lr": 1.0471408478932132e-05, "optim/total_tokens": 1980122529792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2845358848571777, "created_at": "2025-06-03T08:44:38.513541+00:00"} {"global_step": 236050, "acc_step": 0, "speed/wps": 5528.257586350139, "speed/FLOPS": 244320689129237.7, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047316957265138626, "optim/lr": 1.0467861253837585e-05, "optim/total_tokens": 1980130918400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2478491067886353, "created_at": "2025-06-03T08:44:41.483003+00:00"} {"global_step": 236051, "acc_step": 0, "speed/wps": 5517.952324702441, "speed/FLOPS": 243865249311520.2, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04732298478484154, "optim/lr": 1.046431402874326e-05, "optim/total_tokens": 1980139307008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2697927951812744, "created_at": "2025-06-03T08:44:44.456425+00:00"} {"global_step": 236052, "acc_step": 0, "speed/wps": 5516.552542099502, "speed/FLOPS": 243803386085207.12, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04699632152915001, "optim/lr": 1.0460766803648714e-05, "optim/total_tokens": 1980147695616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2771120071411133, "created_at": "2025-06-03T08:44:47.430733+00:00"} {"global_step": 236053, "acc_step": 0, "speed/wps": 5520.456551017095, "speed/FLOPS": 243975923296835.66, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046972814947366714, "optim/lr": 1.0457219578554166e-05, "optim/total_tokens": 1980156084224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.258853554725647, "created_at": "2025-06-03T08:44:50.406573+00:00"} {"global_step": 236054, "acc_step": 0, "speed/wps": 5532.895392677522, "speed/FLOPS": 244525656430463.28, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.1, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047474976629018784, "optim/lr": 1.045367235345962e-05, "optim/total_tokens": 1980164472832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2560375928878784, "created_at": "2025-06-03T08:44:53.375957+00:00"} {"global_step": 236055, "acc_step": 0, "speed/wps": 5517.729439040318, "speed/FLOPS": 243855398906086.56, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0466793067753315, "optim/lr": 1.0450125128365295e-05, "optim/total_tokens": 1980172861440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.278178334236145, "created_at": "2025-06-03T08:44:56.353986+00:00"} {"global_step": 236056, "acc_step": 0, "speed/wps": 5540.851580976443, "speed/FLOPS": 244877279229812.22, "speed/curr_iter_time": 2.9545, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9545, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 193.73, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049150414764881134, "optim/lr": 1.0446577903270749e-05, "optim/total_tokens": 1980181250048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2639687061309814, "created_at": "2025-06-03T08:44:59.315041+00:00"} {"global_step": 236057, "acc_step": 0, "speed/wps": 5511.084514573827, "speed/FLOPS": 243561727256474.34, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0478142574429512, "optim/lr": 1.0443030678176203e-05, "optim/total_tokens": 1980189638656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.261915683746338, "created_at": "2025-06-03T08:45:02.294642+00:00"} {"global_step": 236058, "acc_step": 0, "speed/wps": 5510.343489253187, "speed/FLOPS": 243528977730213.47, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04712669923901558, "optim/lr": 1.0439483453081655e-05, "optim/total_tokens": 1980198027264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2607282400131226, "created_at": "2025-06-03T08:45:05.276440+00:00"} {"global_step": 236059, "acc_step": 0, "speed/wps": 5507.879710530228, "speed/FLOPS": 243420091321421.4, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.43 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.43, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048596180975437164, "optim/lr": 1.043593622798733e-05, "optim/total_tokens": 1980206415872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2585275173187256, "created_at": "2025-06-03T08:45:08.259950+00:00"} {"global_step": 236060, "acc_step": 0, "speed/wps": 5518.560487545258, "speed/FLOPS": 243892126996313.1, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046956080943346024, "optim/lr": 1.0432389002892784e-05, "optim/total_tokens": 1980214804480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2672940492630005, "created_at": "2025-06-03T08:45:11.232937+00:00"} {"global_step": 236061, "acc_step": 0, "speed/wps": 5519.658955104952, "speed/FLOPS": 243940673639984.9, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047029901295900345, "optim/lr": 1.0428841777798237e-05, "optim/total_tokens": 1980223193088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.281762719154358, "created_at": "2025-06-03T08:45:14.206059+00:00"} {"global_step": 236062, "acc_step": 0, "speed/wps": 5533.647740808796, "speed/FLOPS": 244558906366998.75, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.09, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047044869512319565, "optim/lr": 1.0425294552703691e-05, "optim/total_tokens": 1980231581696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2655478715896606, "created_at": "2025-06-03T08:45:17.176096+00:00"} {"global_step": 236063, "acc_step": 0, "speed/wps": 5509.737825421189, "speed/FLOPS": 243502210488907.7, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04854007810354233, "optim/lr": 1.0421747327609365e-05, "optim/total_tokens": 1980239970304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2566953897476196, "created_at": "2025-06-03T08:45:20.159007+00:00"} {"global_step": 236064, "acc_step": 0, "speed/wps": 5525.42515790956, "speed/FLOPS": 244195510289847.1, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04648400470614433, "optim/lr": 1.0418200102514818e-05, "optim/total_tokens": 1980248358912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2594374418258667, "created_at": "2025-06-03T08:45:23.131177+00:00"} {"global_step": 236065, "acc_step": 0, "speed/wps": 5517.487486880439, "speed/FLOPS": 243844705859043.34, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047500595450401306, "optim/lr": 1.0414652877420272e-05, "optim/total_tokens": 1980256747520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2514443397521973, "created_at": "2025-06-03T08:45:26.108875+00:00"} {"global_step": 236066, "acc_step": 0, "speed/wps": 5526.819519537966, "speed/FLOPS": 244257133936832.84, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049074966460466385, "optim/lr": 1.0411105652325726e-05, "optim/total_tokens": 1980265136128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2506531476974487, "created_at": "2025-06-03T08:45:29.080582+00:00"} {"global_step": 236067, "acc_step": 0, "speed/wps": 5517.526580965119, "speed/FLOPS": 243846433617484.56, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04697892442345619, "optim/lr": 1.0407558427231401e-05, "optim/total_tokens": 1980273524736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2597726583480835, "created_at": "2025-06-03T08:45:32.055264+00:00"} {"global_step": 236068, "acc_step": 0, "speed/wps": 5511.496014320917, "speed/FLOPS": 243579913439049.1, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04740123450756073, "optim/lr": 1.0404011202136853e-05, "optim/total_tokens": 1980281913344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.264360785484314, "created_at": "2025-06-03T08:45:35.034677+00:00"} {"global_step": 236069, "acc_step": 0, "speed/wps": 5524.292337935085, "speed/FLOPS": 244145445445273.56, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047854986041784286, "optim/lr": 1.0400463977042307e-05, "optim/total_tokens": 1980290301952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2706849575042725, "created_at": "2025-06-03T08:45:38.005226+00:00"} {"global_step": 236070, "acc_step": 0, "speed/wps": 5529.069282676101, "speed/FLOPS": 244356561952206.75, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046373605728149414, "optim/lr": 1.039691675194776e-05, "optim/total_tokens": 1980298690560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2565873861312866, "created_at": "2025-06-03T08:45:40.974990+00:00"} {"global_step": 236071, "acc_step": 0, "speed/wps": 5521.45314400819, "speed/FLOPS": 244019967606016.72, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04863196238875389, "optim/lr": 1.0393369526853436e-05, "optim/total_tokens": 1980307079168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2500988245010376, "created_at": "2025-06-03T08:45:43.951259+00:00"} {"global_step": 236072, "acc_step": 0, "speed/wps": 5509.820336586838, "speed/FLOPS": 243505857060098.94, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.42 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.42, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049056120216846466, "optim/lr": 1.038982230175889e-05, "optim/total_tokens": 1980315467776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.262263536453247, "created_at": "2025-06-03T08:45:46.929413+00:00"} {"global_step": 236073, "acc_step": 0, "speed/wps": 5517.932501549191, "speed/FLOPS": 243864373229610.66, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04733005538582802, "optim/lr": 1.0386275076664343e-05, "optim/total_tokens": 1980323856384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2621906995773315, "created_at": "2025-06-03T08:45:49.909019+00:00"} {"global_step": 236074, "acc_step": 0, "speed/wps": 5518.978030780771, "speed/FLOPS": 243910580270142.75, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04745529219508171, "optim/lr": 1.0382727851570017e-05, "optim/total_tokens": 1980332244992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2803363800048828, "created_at": "2025-06-03T08:45:52.884078+00:00"} {"global_step": 236075, "acc_step": 0, "speed/wps": 5526.273270888659, "speed/FLOPS": 244232992542487.5, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04803886637091637, "optim/lr": 1.037918062647547e-05, "optim/total_tokens": 1980340633600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2685742378234863, "created_at": "2025-06-03T08:45:55.855350+00:00"} {"global_step": 236076, "acc_step": 0, "speed/wps": 5517.352580938227, "speed/FLOPS": 243838743706908.8, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04662695154547691, "optim/lr": 1.0375633401380924e-05, "optim/total_tokens": 1980349022208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2734038829803467, "created_at": "2025-06-03T08:45:58.834933+00:00"} {"global_step": 236077, "acc_step": 0, "speed/wps": 5519.302813865709, "speed/FLOPS": 243924934020106.47, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04976719990372658, "optim/lr": 1.0372086176286378e-05, "optim/total_tokens": 1980357410816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2667474746704102, "created_at": "2025-06-03T08:46:01.808617+00:00"} {"global_step": 236078, "acc_step": 0, "speed/wps": 5531.26041279448, "speed/FLOPS": 244453398688218.5, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04774099960923195, "optim/lr": 1.0368538951192053e-05, "optim/total_tokens": 1980365799424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2752470970153809, "created_at": "2025-06-03T08:46:04.775498+00:00"} {"global_step": 236079, "acc_step": 0, "speed/wps": 5520.59722225242, "speed/FLOPS": 243982140245416.34, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04770651459693909, "optim/lr": 1.0364991726097505e-05, "optim/total_tokens": 1980374188032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2602345943450928, "created_at": "2025-06-03T08:46:07.750162+00:00"} {"global_step": 236080, "acc_step": 0, "speed/wps": 5525.4547196880685, "speed/FLOPS": 244196816769146.28, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04871102422475815, "optim/lr": 1.0361444501002959e-05, "optim/total_tokens": 1980382576640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.268576741218567, "created_at": "2025-06-03T08:46:10.722115+00:00"} {"global_step": 236081, "acc_step": 0, "speed/wps": 5523.703520571687, "speed/FLOPS": 244119422731651.8, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.46, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04626050963997841, "optim/lr": 1.0357897275908412e-05, "optim/total_tokens": 1980390965248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2609223127365112, "created_at": "2025-06-03T08:46:13.697696+00:00"} {"global_step": 236082, "acc_step": 0, "speed/wps": 5530.09408277543, "speed/FLOPS": 244401852871194.72, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.06424965709447861, "optim/lr": 1.0354350050814088e-05, "optim/total_tokens": 1980399353856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2604066133499146, "created_at": "2025-06-03T08:46:16.666285+00:00"} {"global_step": 236083, "acc_step": 0, "speed/wps": 5515.614043100625, "speed/FLOPS": 243761909233130.12, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04824018478393555, "optim/lr": 1.0350802825719541e-05, "optim/total_tokens": 1980407742464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2728369235992432, "created_at": "2025-06-03T08:46:19.641049+00:00"} {"global_step": 236084, "acc_step": 0, "speed/wps": 5509.328153918137, "speed/FLOPS": 243484105105361.66, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04791169613599777, "optim/lr": 1.0347255600624993e-05, "optim/total_tokens": 1980416131072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2725995779037476, "created_at": "2025-06-03T08:46:22.624008+00:00"} {"global_step": 236085, "acc_step": 0, "speed/wps": 5519.898417515185, "speed/FLOPS": 243951256652837.5, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04745243117213249, "optim/lr": 1.0343708375530447e-05, "optim/total_tokens": 1980424519680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2647181749343872, "created_at": "2025-06-03T08:46:25.600201+00:00"} {"global_step": 236086, "acc_step": 0, "speed/wps": 5515.213087852876, "speed/FLOPS": 243744189063454.62, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04763798415660858, "optim/lr": 1.0340161150436122e-05, "optim/total_tokens": 1980432908288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2535680532455444, "created_at": "2025-06-03T08:46:28.578291+00:00"} {"global_step": 236087, "acc_step": 0, "speed/wps": 5510.623079253171, "speed/FLOPS": 243541334177141.44, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04886889085173607, "optim/lr": 1.0336613925341576e-05, "optim/total_tokens": 1980441296896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2656677961349487, "created_at": "2025-06-03T08:46:31.559604+00:00"} {"global_step": 236088, "acc_step": 0, "speed/wps": 5519.627639075402, "speed/FLOPS": 243939289631768.75, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04903334006667137, "optim/lr": 1.033306670024703e-05, "optim/total_tokens": 1980449685504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.281362533569336, "created_at": "2025-06-03T08:46:34.532410+00:00"} {"global_step": 236089, "acc_step": 0, "speed/wps": 5508.785949290597, "speed/FLOPS": 243460142436079.25, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047923531383275986, "optim/lr": 1.0329519475152482e-05, "optim/total_tokens": 1980458074112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2740212678909302, "created_at": "2025-06-03T08:46:37.513676+00:00"} {"global_step": 236090, "acc_step": 0, "speed/wps": 5519.812538291064, "speed/FLOPS": 243947461230701.03, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047126274555921555, "optim/lr": 1.0325972250058157e-05, "optim/total_tokens": 1980466462720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2716777324676514, "created_at": "2025-06-03T08:46:40.486423+00:00"} {"global_step": 236091, "acc_step": 0, "speed/wps": 5500.927627666654, "speed/FLOPS": 243112844842837.3, "speed/curr_iter_time": 2.9775, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9775, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.41 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.41, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04665744677186012, "optim/lr": 1.032242502496361e-05, "optim/total_tokens": 1980474851328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2609199285507202, "created_at": "2025-06-03T08:46:43.470238+00:00"} {"global_step": 236092, "acc_step": 0, "speed/wps": 5523.206263456124, "speed/FLOPS": 244097446512336.62, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04760781675577164, "optim/lr": 1.0318877799869064e-05, "optim/total_tokens": 1980483239936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.268753170967102, "created_at": "2025-06-03T08:46:46.444621+00:00"} {"global_step": 236093, "acc_step": 0, "speed/wps": 5518.0253419765, "speed/FLOPS": 243868476301297.3, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04748592525720596, "optim/lr": 1.0315330574774518e-05, "optim/total_tokens": 1980491628544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.267854928970337, "created_at": "2025-06-03T08:46:49.419252+00:00"} {"global_step": 236094, "acc_step": 0, "speed/wps": 5524.490062028853, "speed/FLOPS": 244154183838174.44, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.44, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04799051955342293, "optim/lr": 1.0311783349680193e-05, "optim/total_tokens": 1980500017152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2648955583572388, "created_at": "2025-06-03T08:46:52.389399+00:00"} {"global_step": 236095, "acc_step": 0, "speed/wps": 5510.745135434031, "speed/FLOPS": 243546728435595.28, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04681951925158501, "optim/lr": 1.0308236124585645e-05, "optim/total_tokens": 1980508405760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2804378271102905, "created_at": "2025-06-03T08:46:55.370585+00:00"} {"global_step": 236096, "acc_step": 0, "speed/wps": 5509.812266984172, "speed/FLOPS": 243505500424965.1, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046490006148815155, "optim/lr": 1.0304688899491099e-05, "optim/total_tokens": 1980516794368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2667337656021118, "created_at": "2025-06-03T08:46:58.349078+00:00"} {"global_step": 236097, "acc_step": 0, "speed/wps": 5507.752702557175, "speed/FLOPS": 243414478219098.22, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047216881066560745, "optim/lr": 1.0301141674396553e-05, "optim/total_tokens": 1980525182976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2580363750457764, "created_at": "2025-06-03T08:47:01.328269+00:00"} {"global_step": 236098, "acc_step": 0, "speed/wps": 5520.787578080767, "speed/FLOPS": 243990552998699.84, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04936669021844864, "optim/lr": 1.0297594449302228e-05, "optim/total_tokens": 1980533571584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2675976753234863, "created_at": "2025-06-03T08:47:04.300950+00:00"} {"global_step": 236099, "acc_step": 0, "speed/wps": 5519.764866626788, "speed/FLOPS": 243945354387145.72, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04928942769765854, "optim/lr": 1.0294047224207682e-05, "optim/total_tokens": 1980541960192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2598719596862793, "created_at": "2025-06-03T08:47:07.273559+00:00"} {"global_step": 236100, "acc_step": 0, "speed/wps": 5516.089813652194, "speed/FLOPS": 243782935856295.03, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05073917284607887, "optim/lr": 1.0290499999113134e-05, "optim/total_tokens": 1980550348800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2732691764831543, "created_at": "2025-06-03T08:47:10.249096+00:00"} {"global_step": 236101, "acc_step": 0, "speed/wps": 5508.902750568388, "speed/FLOPS": 243465304454714.47, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.052256323397159576, "optim/lr": 1.0286952774018809e-05, "optim/total_tokens": 1980558737408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2587878704071045, "created_at": "2025-06-03T08:47:13.227836+00:00"} {"global_step": 236102, "acc_step": 0, "speed/wps": 5502.05960983358, "speed/FLOPS": 243162872660605.44, "speed/curr_iter_time": 2.977, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.977, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.4 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.4, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04636625945568085, "optim/lr": 1.0283405548924263e-05, "optim/total_tokens": 1980567126016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2530134916305542, "created_at": "2025-06-03T08:47:16.210783+00:00"} {"global_step": 236103, "acc_step": 0, "speed/wps": 5516.868109960376, "speed/FLOPS": 243817332569435.06, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047350067645311356, "optim/lr": 1.0279858323829716e-05, "optim/total_tokens": 1980575514624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.267805576324463, "created_at": "2025-06-03T08:47:19.190603+00:00"} {"global_step": 236104, "acc_step": 0, "speed/wps": 5525.385718834858, "speed/FLOPS": 244193767284612.78, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047764603048563004, "optim/lr": 1.027631109873517e-05, "optim/total_tokens": 1980583903232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2591196298599243, "created_at": "2025-06-03T08:47:22.160759+00:00"} {"global_step": 236105, "acc_step": 0, "speed/wps": 5524.052028413947, "speed/FLOPS": 244134824994454.88, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05112418904900551, "optim/lr": 1.0272763873640844e-05, "optim/total_tokens": 1980592291840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.262195348739624, "created_at": "2025-06-03T08:47:25.134525+00:00"} {"global_step": 236106, "acc_step": 0, "speed/wps": 5516.446357687718, "speed/FLOPS": 243798693277707.38, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0490545891225338, "optim/lr": 1.0269216648546297e-05, "optim/total_tokens": 1980600680448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2782353162765503, "created_at": "2025-06-03T08:47:28.110506+00:00"} {"global_step": 236107, "acc_step": 0, "speed/wps": 5518.159408886379, "speed/FLOPS": 243874401372497.3, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048459529876708984, "optim/lr": 1.0265669423451751e-05, "optim/total_tokens": 1980609069056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.250221610069275, "created_at": "2025-06-03T08:47:31.083787+00:00"} {"global_step": 236108, "acc_step": 0, "speed/wps": 5516.333372552234, "speed/FLOPS": 243793699913029.34, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049477387219667435, "optim/lr": 1.0262122198357205e-05, "optim/total_tokens": 1980617457664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2618407011032104, "created_at": "2025-06-03T08:47:34.057945+00:00"} {"global_step": 236109, "acc_step": 0, "speed/wps": 5513.640416566711, "speed/FLOPS": 243674685042267.47, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04683941602706909, "optim/lr": 1.025857497326288e-05, "optim/total_tokens": 1980625846272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2659194469451904, "created_at": "2025-06-03T08:47:37.034881+00:00"} {"global_step": 236110, "acc_step": 0, "speed/wps": 5505.561705117942, "speed/FLOPS": 243317647346825.62, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 195.01, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046416986733675, "optim/lr": 1.0255027748168334e-05, "optim/total_tokens": 1980634234880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2559083700180054, "created_at": "2025-06-03T08:47:40.016468+00:00"} {"global_step": 236111, "acc_step": 0, "speed/wps": 5506.8327995983045, "speed/FLOPS": 243373823216806.28, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.39 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.39, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04693824425339699, "optim/lr": 1.0251480523073786e-05, "optim/total_tokens": 1980642623488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2644761800765991, "created_at": "2025-06-03T08:47:42.999418+00:00"} {"global_step": 236112, "acc_step": 0, "speed/wps": 5525.7244156707875, "speed/FLOPS": 244208735951153.28, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04655131325125694, "optim/lr": 1.024793329797924e-05, "optim/total_tokens": 1980651012096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2551020383834839, "created_at": "2025-06-03T08:47:45.974398+00:00"} {"global_step": 236113, "acc_step": 0, "speed/wps": 5524.694269175291, "speed/FLOPS": 244163208748820.1, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046883534640073776, "optim/lr": 1.0244386072884915e-05, "optim/total_tokens": 1980659400704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2712029218673706, "created_at": "2025-06-03T08:47:48.944934+00:00"} {"global_step": 236114, "acc_step": 0, "speed/wps": 5519.22079591916, "speed/FLOPS": 243921309246674.9, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04714144766330719, "optim/lr": 1.0240838847790368e-05, "optim/total_tokens": 1980667789312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2734160423278809, "created_at": "2025-06-03T08:47:51.918434+00:00"} {"global_step": 236115, "acc_step": 0, "speed/wps": 5508.386388423732, "speed/FLOPS": 243442483890901.7, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047271016985177994, "optim/lr": 1.0237291622695822e-05, "optim/total_tokens": 1980676177920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.272303581237793, "created_at": "2025-06-03T08:47:54.898187+00:00"} {"global_step": 236116, "acc_step": 0, "speed/wps": 5527.249361728841, "speed/FLOPS": 244276130761537.75, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04648945480585098, "optim/lr": 1.0233744397601274e-05, "optim/total_tokens": 1980684566528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.266592264175415, "created_at": "2025-06-03T08:47:57.871050+00:00"} {"global_step": 236117, "acc_step": 0, "speed/wps": 5511.364534168844, "speed/FLOPS": 243574102689303.9, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04668542742729187, "optim/lr": 1.023019717250695e-05, "optim/total_tokens": 1980692955136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2713241577148438, "created_at": "2025-06-03T08:48:00.851232+00:00"} {"global_step": 236118, "acc_step": 0, "speed/wps": 5517.710568888544, "speed/FLOPS": 243854564941964.38, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047254834324121475, "optim/lr": 1.0226649947412403e-05, "optim/total_tokens": 1980701343744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2458415031433105, "created_at": "2025-06-03T08:48:03.829191+00:00"} {"global_step": 236119, "acc_step": 0, "speed/wps": 5503.9572700804065, "speed/FLOPS": 243246739530409.53, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.38 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.38, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04605196788907051, "optim/lr": 1.0223102722317857e-05, "optim/total_tokens": 1980709732352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2810324430465698, "created_at": "2025-06-03T08:48:06.810574+00:00"} {"global_step": 236120, "acc_step": 0, "speed/wps": 5520.147814124594, "speed/FLOPS": 243962278706445.78, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04910902678966522, "optim/lr": 1.021955549722331e-05, "optim/total_tokens": 1980718120960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2680617570877075, "created_at": "2025-06-03T08:48:09.785961+00:00"} {"global_step": 236121, "acc_step": 0, "speed/wps": 5517.773776941631, "speed/FLOPS": 243857358414382.66, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046323396265506744, "optim/lr": 1.0216008272128984e-05, "optim/total_tokens": 1980726509568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.249626874923706, "created_at": "2025-06-03T08:48:12.759620+00:00"} {"global_step": 236122, "acc_step": 0, "speed/wps": 5523.318059771938, "speed/FLOPS": 244102387337270.2, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04893660545349121, "optim/lr": 1.0212461047034438e-05, "optim/total_tokens": 1980734898176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2607859373092651, "created_at": "2025-06-03T08:48:15.730530+00:00"} {"global_step": 236123, "acc_step": 0, "speed/wps": 5520.530246109986, "speed/FLOPS": 243979180242735.78, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04740482196211815, "optim/lr": 1.0208913821939891e-05, "optim/total_tokens": 1980743286784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2572427988052368, "created_at": "2025-06-03T08:48:18.702924+00:00"} {"global_step": 236124, "acc_step": 0, "speed/wps": 5520.269869080655, "speed/FLOPS": 243967672910769.75, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04877251386642456, "optim/lr": 1.0205366596845345e-05, "optim/total_tokens": 1980751675392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2675814628601074, "created_at": "2025-06-03T08:48:21.680658+00:00"} {"global_step": 236125, "acc_step": 0, "speed/wps": 5509.102148240657, "speed/FLOPS": 243474116811218.94, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 195.01, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04630839824676514, "optim/lr": 1.020181937175102e-05, "optim/total_tokens": 1980760064000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2725073099136353, "created_at": "2025-06-03T08:48:24.660870+00:00"} {"global_step": 236126, "acc_step": 0, "speed/wps": 5511.80148393763, "speed/FLOPS": 243593413632572.56, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04785003140568733, "optim/lr": 1.0198272146656472e-05, "optim/total_tokens": 1980768452608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2636851072311401, "created_at": "2025-06-03T08:48:27.638957+00:00"} {"global_step": 236127, "acc_step": 0, "speed/wps": 5506.57766616158, "speed/FLOPS": 243362547624794.38, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046611588448286057, "optim/lr": 1.0194724921561926e-05, "optim/total_tokens": 1980776841216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.25603187084198, "created_at": "2025-06-03T08:48:30.618618+00:00"} {"global_step": 236128, "acc_step": 0, "speed/wps": 5525.411776770561, "speed/FLOPS": 244194918911994.22, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.44, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04654987156391144, "optim/lr": 1.0191177696467601e-05, "optim/total_tokens": 1980785229824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2524551153182983, "created_at": "2025-06-03T08:48:33.591794+00:00"} {"global_step": 236129, "acc_step": 0, "speed/wps": 5523.831356757654, "speed/FLOPS": 244125072436746.7, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047201212495565414, "optim/lr": 1.0187630471373055e-05, "optim/total_tokens": 1980793618432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2536581754684448, "created_at": "2025-06-03T08:48:36.565028+00:00"} {"global_step": 236130, "acc_step": 0, "speed/wps": 5509.075790184731, "speed/FLOPS": 243472951920059.78, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04670661687850952, "optim/lr": 1.0184083246278509e-05, "optim/total_tokens": 1980802007040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.26214599609375, "created_at": "2025-06-03T08:48:39.543412+00:00"} {"global_step": 236131, "acc_step": 0, "speed/wps": 5522.437590440294, "speed/FLOPS": 244063475099462.1, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04706161841750145, "optim/lr": 1.0180536021183962e-05, "optim/total_tokens": 1980810395648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2734652757644653, "created_at": "2025-06-03T08:48:42.514311+00:00"} {"global_step": 236132, "acc_step": 0, "speed/wps": 5513.91978518422, "speed/FLOPS": 243687031705223.16, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046404946595430374, "optim/lr": 1.0176988796089636e-05, "optim/total_tokens": 1980818784256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.272271990776062, "created_at": "2025-06-03T08:48:45.490403+00:00"} {"global_step": 236133, "acc_step": 0, "speed/wps": 5508.205540640944, "speed/FLOPS": 243434491344565.34, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046901654452085495, "optim/lr": 1.017344157099509e-05, "optim/total_tokens": 1980827172864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2491066455841064, "created_at": "2025-06-03T08:48:48.474811+00:00"} {"global_step": 236134, "acc_step": 0, "speed/wps": 5511.370305424802, "speed/FLOPS": 243574357749277.25, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046728529036045074, "optim/lr": 1.0169894345900543e-05, "optim/total_tokens": 1980835561472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2652688026428223, "created_at": "2025-06-03T08:48:51.451645+00:00"} {"global_step": 236135, "acc_step": 0, "speed/wps": 5505.088131322291, "speed/FLOPS": 243296717809028.25, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.37 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.37, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04687078669667244, "optim/lr": 1.0166347120805997e-05, "optim/total_tokens": 1980843950080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2544916868209839, "created_at": "2025-06-03T08:48:54.432463+00:00"} {"global_step": 236136, "acc_step": 0, "speed/wps": 5519.7346560634705, "speed/FLOPS": 243944019234878.78, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05230381339788437, "optim/lr": 1.0162799895711672e-05, "optim/total_tokens": 1980852338688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.257152795791626, "created_at": "2025-06-03T08:48:57.404948+00:00"} {"global_step": 236137, "acc_step": 0, "speed/wps": 5525.3481584587225, "speed/FLOPS": 244192107308239.0, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046809807419776917, "optim/lr": 1.0159252670617124e-05, "optim/total_tokens": 1980860727296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2760450839996338, "created_at": "2025-06-03T08:49:00.374779+00:00"} {"global_step": 236138, "acc_step": 0, "speed/wps": 5521.836597485106, "speed/FLOPS": 244036914287003.56, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.57, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04700125381350517, "optim/lr": 1.0155705445522578e-05, "optim/total_tokens": 1980869115904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2670446634292603, "created_at": "2025-06-03T08:49:03.348673+00:00"} {"global_step": 236139, "acc_step": 0, "speed/wps": 5520.16816851183, "speed/FLOPS": 243963178266178.4, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04615342617034912, "optim/lr": 1.0152158220428032e-05, "optim/total_tokens": 1980877504512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.267322301864624, "created_at": "2025-06-03T08:49:06.321216+00:00"} {"global_step": 236140, "acc_step": 0, "speed/wps": 5516.147989415289, "speed/FLOPS": 243785506927253.28, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047980573028326035, "optim/lr": 1.0148610995333707e-05, "optim/total_tokens": 1980885893120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.262445092201233, "created_at": "2025-06-03T08:49:09.299990+00:00"} {"global_step": 236141, "acc_step": 0, "speed/wps": 5506.324789981388, "speed/FLOPS": 243351371791967.5, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04725418612360954, "optim/lr": 1.014506377023916e-05, "optim/total_tokens": 1980894281728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2628309726715088, "created_at": "2025-06-03T08:49:12.280174+00:00"} {"global_step": 236142, "acc_step": 0, "speed/wps": 5510.78311855698, "speed/FLOPS": 243548407095214.38, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.051224563270807266, "optim/lr": 1.0141516545144613e-05, "optim/total_tokens": 1980902670336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.252465844154358, "created_at": "2025-06-03T08:49:15.260167+00:00"} {"global_step": 236143, "acc_step": 0, "speed/wps": 5502.874987458859, "speed/FLOPS": 243198908178161.78, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04712982103228569, "optim/lr": 1.0137969320050066e-05, "optim/total_tokens": 1980911058944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2624143362045288, "created_at": "2025-06-03T08:49:18.242089+00:00"} {"global_step": 236144, "acc_step": 0, "speed/wps": 5510.275208325439, "speed/FLOPS": 243525960062700.5, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.36 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.36, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04764658957719803, "optim/lr": 1.0134422094955742e-05, "optim/total_tokens": 1980919447552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2572823762893677, "created_at": "2025-06-03T08:49:21.220191+00:00"} {"global_step": 236145, "acc_step": 0, "speed/wps": 5525.948054035658, "speed/FLOPS": 244218619622195.62, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04673081263899803, "optim/lr": 1.0130874869861195e-05, "optim/total_tokens": 1980927836160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.280602216720581, "created_at": "2025-06-03T08:49:24.189433+00:00"} {"global_step": 236146, "acc_step": 0, "speed/wps": 5531.658084468337, "speed/FLOPS": 244470973740734.8, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04624471440911293, "optim/lr": 1.0127327644766649e-05, "optim/total_tokens": 1980936224768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2618016004562378, "created_at": "2025-06-03T08:49:27.159235+00:00"} {"global_step": 236147, "acc_step": 0, "speed/wps": 5528.968821967825, "speed/FLOPS": 244352122103105.47, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04878515750169754, "optim/lr": 1.0123780419672101e-05, "optim/total_tokens": 1980944613376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2599718570709229, "created_at": "2025-06-03T08:49:30.127075+00:00"} {"global_step": 236148, "acc_step": 0, "speed/wps": 5525.411666570152, "speed/FLOPS": 244194914041700.22, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0460815392434597, "optim/lr": 1.0120233194577776e-05, "optim/total_tokens": 1980953001984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2611943483352661, "created_at": "2025-06-03T08:49:33.096868+00:00"} {"global_step": 236149, "acc_step": 0, "speed/wps": 5522.314239163354, "speed/FLOPS": 244058023604390.38, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04846379905939102, "optim/lr": 1.011668596948323e-05, "optim/total_tokens": 1980961390592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2456698417663574, "created_at": "2025-06-03T08:49:36.070239+00:00"} {"global_step": 236150, "acc_step": 0, "speed/wps": 5519.310790079164, "speed/FLOPS": 243925286527915.22, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04674052447080612, "optim/lr": 1.0113138744388684e-05, "optim/total_tokens": 1980969779200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.25576913356781, "created_at": "2025-06-03T08:49:39.046972+00:00"} {"global_step": 236151, "acc_step": 0, "speed/wps": 5519.207171229949, "speed/FLOPS": 243920707105149.28, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04637966677546501, "optim/lr": 1.0109591519294137e-05, "optim/total_tokens": 1980978167808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.276707649230957, "created_at": "2025-06-03T08:49:42.019862+00:00"} {"global_step": 236152, "acc_step": 0, "speed/wps": 5521.536061891581, "speed/FLOPS": 244023632152050.38, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0465683676302433, "optim/lr": 1.0106044294199813e-05, "optim/total_tokens": 1980986556416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.272434949874878, "created_at": "2025-06-03T08:49:44.991417+00:00"} {"global_step": 236153, "acc_step": 0, "speed/wps": 5517.546999955792, "speed/FLOPS": 243847336032358.4, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050000596791505814, "optim/lr": 1.0102497069105265e-05, "optim/total_tokens": 1980994945024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2687065601348877, "created_at": "2025-06-03T08:49:47.965185+00:00"} {"global_step": 236154, "acc_step": 0, "speed/wps": 5515.712004385524, "speed/FLOPS": 243766238620511.34, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05613178759813309, "optim/lr": 1.0098949844010718e-05, "optim/total_tokens": 1981003333632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2700386047363281, "created_at": "2025-06-03T08:49:50.943883+00:00"} {"global_step": 236155, "acc_step": 0, "speed/wps": 5517.802875726153, "speed/FLOPS": 243858644431717.44, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05312614142894745, "optim/lr": 1.0095402618916394e-05, "optim/total_tokens": 1981011722240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2801916599273682, "created_at": "2025-06-03T08:49:53.920013+00:00"} {"global_step": 236156, "acc_step": 0, "speed/wps": 5519.896347802296, "speed/FLOPS": 243951165182121.53, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04635219648480415, "optim/lr": 1.0091855393821847e-05, "optim/total_tokens": 1981020110848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2733930349349976, "created_at": "2025-06-03T08:49:56.893184+00:00"} {"global_step": 236157, "acc_step": 0, "speed/wps": 5509.9856139792, "speed/FLOPS": 243513161474874.97, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04894557222723961, "optim/lr": 1.0088308168727301e-05, "optim/total_tokens": 1981028499456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2803202867507935, "created_at": "2025-06-03T08:49:59.871662+00:00"} {"global_step": 236158, "acc_step": 0, "speed/wps": 5517.519405065623, "speed/FLOPS": 243846116479456.4, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.049649909138679504, "optim/lr": 1.0084760943632753e-05, "optim/total_tokens": 1981036888064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2686970233917236, "created_at": "2025-06-03T08:50:02.849244+00:00"} {"global_step": 236159, "acc_step": 0, "speed/wps": 5509.297310421385, "speed/FLOPS": 243482741980676.53, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04640628397464752, "optim/lr": 1.0081213718538428e-05, "optim/total_tokens": 1981045276672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2726714611053467, "created_at": "2025-06-03T08:50:05.827865+00:00"} {"global_step": 236160, "acc_step": 0, "speed/wps": 5509.26194350454, "speed/FLOPS": 243481178943976.25, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.35 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.35, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05024569109082222, "optim/lr": 1.0077666493443882e-05, "optim/total_tokens": 1981053665280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2586420774459839, "created_at": "2025-06-03T08:50:08.807210+00:00"} {"global_step": 236161, "acc_step": 0, "speed/wps": 5508.64686771514, "speed/FLOPS": 243453995742328.06, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04718074947595596, "optim/lr": 1.0074119268349336e-05, "optim/total_tokens": 1981062053888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2513326406478882, "created_at": "2025-06-03T08:50:11.788159+00:00"} {"global_step": 236162, "acc_step": 0, "speed/wps": 5518.4907053707775, "speed/FLOPS": 243889042981378.6, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04679626226425171, "optim/lr": 1.007057204325479e-05, "optim/total_tokens": 1981070442496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.273652195930481, "created_at": "2025-06-03T08:50:14.763069+00:00"} {"global_step": 236163, "acc_step": 0, "speed/wps": 5517.371353902502, "speed/FLOPS": 243839573375841.0, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04774489626288414, "optim/lr": 1.0067024818160465e-05, "optim/total_tokens": 1981078831104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2618874311447144, "created_at": "2025-06-03T08:50:17.737129+00:00"} {"global_step": 236164, "acc_step": 0, "speed/wps": 5529.151868162075, "speed/FLOPS": 244360211807975.97, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0458940789103508, "optim/lr": 1.0063477593065917e-05, "optim/total_tokens": 1981087219712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2536935806274414, "created_at": "2025-06-03T08:50:20.710377+00:00"} {"global_step": 236165, "acc_step": 0, "speed/wps": 5511.853364403735, "speed/FLOPS": 243595706483626.12, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0507102906703949, "optim/lr": 1.005993036797137e-05, "optim/total_tokens": 1981095608320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2638871669769287, "created_at": "2025-06-03T08:50:23.688012+00:00"} {"global_step": 236166, "acc_step": 0, "speed/wps": 5520.496163151745, "speed/FLOPS": 243977673950433.9, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046990033239126205, "optim/lr": 1.0056383142876824e-05, "optim/total_tokens": 1981103996928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2728818655014038, "created_at": "2025-06-03T08:50:26.664695+00:00"} {"global_step": 236167, "acc_step": 0, "speed/wps": 5504.357386881531, "speed/FLOPS": 243264422645035.78, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047956615686416626, "optim/lr": 1.00528359177825e-05, "optim/total_tokens": 1981112385536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2619366645812988, "created_at": "2025-06-03T08:50:29.645756+00:00"} {"global_step": 236168, "acc_step": 0, "speed/wps": 5511.227272919037, "speed/FLOPS": 243568036444629.2, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04901604354381561, "optim/lr": 1.0049288692687953e-05, "optim/total_tokens": 1981120774144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2748596668243408, "created_at": "2025-06-03T08:50:32.627735+00:00"} {"global_step": 236169, "acc_step": 0, "speed/wps": 5499.690905693664, "speed/FLOPS": 243058188061748.03, "speed/curr_iter_time": 2.9782, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9782, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.34 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.34, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047271888703107834, "optim/lr": 1.0045741467593405e-05, "optim/total_tokens": 1981129162752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2632074356079102, "created_at": "2025-06-03T08:50:35.616668+00:00"} {"global_step": 236170, "acc_step": 0, "speed/wps": 5514.619971970841, "speed/FLOPS": 243717976377310.97, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0471598356962204, "optim/lr": 1.0042194242498859e-05, "optim/total_tokens": 1981137551360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2597533464431763, "created_at": "2025-06-03T08:50:38.597638+00:00"} {"global_step": 236171, "acc_step": 0, "speed/wps": 5518.422787572465, "speed/FLOPS": 243886041362327.97, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05013106390833855, "optim/lr": 1.0038647017404534e-05, "optim/total_tokens": 1981145939968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2693973779678345, "created_at": "2025-06-03T08:50:41.574533+00:00"} {"global_step": 236172, "acc_step": 0, "speed/wps": 5523.376372928064, "speed/FLOPS": 244104964480297.12, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04593144729733467, "optim/lr": 1.0035099792309988e-05, "optim/total_tokens": 1981154328576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2493419647216797, "created_at": "2025-06-03T08:50:44.551352+00:00"} {"global_step": 236173, "acc_step": 0, "speed/wps": 5511.649280422199, "speed/FLOPS": 243586687016238.72, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05236406996846199, "optim/lr": 1.0031552567215441e-05, "optim/total_tokens": 1981162717184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2649332284927368, "created_at": "2025-06-03T08:50:47.528878+00:00"} {"global_step": 236174, "acc_step": 0, "speed/wps": 5525.060979505983, "speed/FLOPS": 244179415468443.03, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047420717775821686, "optim/lr": 1.0028005342120893e-05, "optim/total_tokens": 1981171105792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2551367282867432, "created_at": "2025-06-03T08:50:50.498452+00:00"} {"global_step": 236175, "acc_step": 0, "speed/wps": 5525.208679672345, "speed/FLOPS": 244185943059798.28, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050499171018600464, "optim/lr": 1.0024458117026569e-05, "optim/total_tokens": 1981179494400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.252480149269104, "created_at": "2025-06-03T08:50:53.468495+00:00"} {"global_step": 236176, "acc_step": 0, "speed/wps": 5514.5770339427845, "speed/FLOPS": 243716078736247.62, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0481213815510273, "optim/lr": 1.0020910891932022e-05, "optim/total_tokens": 1981187883008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2725800275802612, "created_at": "2025-06-03T08:50:56.449697+00:00"} {"global_step": 236177, "acc_step": 0, "speed/wps": 5512.857299001051, "speed/FLOPS": 243640075254224.38, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.8, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04868042841553688, "optim/lr": 1.0017363666837476e-05, "optim/total_tokens": 1981196271616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2794417142868042, "created_at": "2025-06-03T08:50:59.426812+00:00"} {"global_step": 236178, "acc_step": 0, "speed/wps": 5509.717892567877, "speed/FLOPS": 243501329558816.9, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047008391469717026, "optim/lr": 1.001381644174293e-05, "optim/total_tokens": 1981204660224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2655612230300903, "created_at": "2025-06-03T08:51:02.407631+00:00"} {"global_step": 236179, "acc_step": 0, "speed/wps": 5512.954129267344, "speed/FLOPS": 243644354656372.28, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046853162348270416, "optim/lr": 1.0010269216648603e-05, "optim/total_tokens": 1981213048832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2712373733520508, "created_at": "2025-06-03T08:51:05.384131+00:00"} {"global_step": 236180, "acc_step": 0, "speed/wps": 5518.2592915192345, "speed/FLOPS": 243878815673623.84, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.33 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.33, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04982050135731697, "optim/lr": 1.0006721991554057e-05, "optim/total_tokens": 1981221437440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2606191635131836, "created_at": "2025-06-03T08:51:08.360849+00:00"} {"global_step": 236181, "acc_step": 0, "speed/wps": 5522.748861259045, "speed/FLOPS": 244077231676422.4, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047428395599126816, "optim/lr": 1.000317476645951e-05, "optim/total_tokens": 1981229826048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2732983827590942, "created_at": "2025-06-03T08:51:11.333112+00:00"} {"global_step": 236182, "acc_step": 0, "speed/wps": 5524.39573189555, "speed/FLOPS": 244150014929107.84, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05202498286962509, "optim/lr": 9.999627541365186e-06, "optim/total_tokens": 1981238214656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2650812864303589, "created_at": "2025-06-03T08:51:14.303221+00:00"} {"global_step": 236183, "acc_step": 0, "speed/wps": 5513.504170295257, "speed/FLOPS": 243668663654440.84, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04903284087777138, "optim/lr": 9.99608031627064e-06, "optim/total_tokens": 1981246603264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.260413408279419, "created_at": "2025-06-03T08:51:17.281660+00:00"} {"global_step": 236184, "acc_step": 0, "speed/wps": 5524.175614758227, "speed/FLOPS": 244140286878299.84, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04649592563509941, "optim/lr": 9.992533091176092e-06, "optim/total_tokens": 1981254991872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2677021026611328, "created_at": "2025-06-03T08:51:20.255201+00:00"} {"global_step": 236185, "acc_step": 0, "speed/wps": 5512.393554507506, "speed/FLOPS": 243619580121269.22, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05040634050965309, "optim/lr": 9.988985866081545e-06, "optim/total_tokens": 1981263380480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2666881084442139, "created_at": "2025-06-03T08:51:23.233001+00:00"} {"global_step": 236186, "acc_step": 0, "speed/wps": 5524.953571526158, "speed/FLOPS": 244174668585498.66, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047653790563344955, "optim/lr": 9.98543864098722e-06, "optim/total_tokens": 1981271769088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2691982984542847, "created_at": "2025-06-03T08:51:26.203273+00:00"} {"global_step": 236187, "acc_step": 0, "speed/wps": 5530.9880581247635, "speed/FLOPS": 244441362005854.6, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.19, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048786699771881104, "optim/lr": 9.981891415892674e-06, "optim/total_tokens": 1981280157696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2645114660263062, "created_at": "2025-06-03T08:51:29.170368+00:00"} {"global_step": 236188, "acc_step": 0, "speed/wps": 5530.705281138713, "speed/FLOPS": 244428864710455.0, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05166879668831825, "optim/lr": 9.978344190798128e-06, "optim/total_tokens": 1981288546304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2586654424667358, "created_at": "2025-06-03T08:51:32.137244+00:00"} {"global_step": 236189, "acc_step": 0, "speed/wps": 5532.632067961668, "speed/FLOPS": 244514018825840.62, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046057846397161484, "optim/lr": 9.974796965703582e-06, "optim/total_tokens": 1981296934912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2708075046539307, "created_at": "2025-06-03T08:51:35.104189+00:00"} {"global_step": 236190, "acc_step": 0, "speed/wps": 5520.45366755826, "speed/FLOPS": 243975795862714.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050813525915145874, "optim/lr": 9.971249740609255e-06, "optim/total_tokens": 1981305323520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2573797702789307, "created_at": "2025-06-03T08:51:38.076853+00:00"} {"global_step": 236191, "acc_step": 0, "speed/wps": 5513.0914769809315, "speed/FLOPS": 243650424722303.53, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04911762475967407, "optim/lr": 9.967702515514709e-06, "optim/total_tokens": 1981313712128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2536075115203857, "created_at": "2025-06-03T08:51:41.053185+00:00"} {"global_step": 236192, "acc_step": 0, "speed/wps": 5522.702730867269, "speed/FLOPS": 244075192949222.62, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04678360000252724, "optim/lr": 9.964155290420163e-06, "optim/total_tokens": 1981322100736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2679362297058105, "created_at": "2025-06-03T08:51:44.029563+00:00"} {"global_step": 236193, "acc_step": 0, "speed/wps": 5509.674143900929, "speed/FLOPS": 243499396091663.78, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05020427703857422, "optim/lr": 9.960608065325616e-06, "optim/total_tokens": 1981330489344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2734869718551636, "created_at": "2025-06-03T08:51:47.012477+00:00"} {"global_step": 236194, "acc_step": 0, "speed/wps": 5516.847269100902, "speed/FLOPS": 243816411510119.47, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04974307492375374, "optim/lr": 9.957060840231292e-06, "optim/total_tokens": 1981338877952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2719794511795044, "created_at": "2025-06-03T08:51:49.987979+00:00"} {"global_step": 236195, "acc_step": 0, "speed/wps": 5507.883289615986, "speed/FLOPS": 243420249498692.47, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04673770070075989, "optim/lr": 9.953513615136744e-06, "optim/total_tokens": 1981347266560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2667068243026733, "created_at": "2025-06-03T08:51:52.972524+00:00"} {"global_step": 236196, "acc_step": 0, "speed/wps": 5496.40702077535, "speed/FLOPS": 242913057156805.28, "speed/curr_iter_time": 2.9799, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9799, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.32 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.32, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04978082701563835, "optim/lr": 9.949966390042197e-06, "optim/total_tokens": 1981355655168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.26466703414917, "created_at": "2025-06-03T08:51:55.963763+00:00"} {"global_step": 236197, "acc_step": 0, "speed/wps": 5440.8219026777615, "speed/FLOPS": 240456479447317.78, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05016910657286644, "optim/lr": 9.946419164947651e-06, "optim/total_tokens": 1981364043776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2614248991012573, "created_at": "2025-06-03T08:51:58.984412+00:00"} {"global_step": 236198, "acc_step": 0, "speed/wps": 5527.365946087526, "speed/FLOPS": 244281283193458.78, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04656552895903587, "optim/lr": 9.942871939853326e-06, "optim/total_tokens": 1981372432384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2611017227172852, "created_at": "2025-06-03T08:52:01.957621+00:00"} {"global_step": 236199, "acc_step": 0, "speed/wps": 5523.845918778751, "speed/FLOPS": 244125716003544.0, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05139826983213425, "optim/lr": 9.93932471475878e-06, "optim/total_tokens": 1981380820992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2579905986785889, "created_at": "2025-06-03T08:52:04.933977+00:00"} {"global_step": 236200, "acc_step": 0, "speed/wps": 5509.465802413414, "speed/FLOPS": 243490188464304.03, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04795568436384201, "optim/lr": 9.935777489664232e-06, "optim/total_tokens": 1981389209600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.268246054649353, "created_at": "2025-06-03T08:52:07.915360+00:00"} {"global_step": 236201, "acc_step": 0, "speed/wps": 5514.602871616634, "speed/FLOPS": 243717220629182.56, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04799053817987442, "optim/lr": 9.932230264569686e-06, "optim/total_tokens": 1981397598208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2677072286605835, "created_at": "2025-06-03T08:52:10.891376+00:00"} {"global_step": 236202, "acc_step": 0, "speed/wps": 5522.1801063645535, "speed/FLOPS": 244052095621237.3, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.052491575479507446, "optim/lr": 9.928683039475361e-06, "optim/total_tokens": 1981405986816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2680485248565674, "created_at": "2025-06-03T08:52:13.867459+00:00"} {"global_step": 236203, "acc_step": 0, "speed/wps": 5518.180023825625, "speed/FLOPS": 243875312447295.12, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.31 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.31, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046433158218860626, "optim/lr": 9.925135814380815e-06, "optim/total_tokens": 1981414375424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2632642984390259, "created_at": "2025-06-03T08:52:16.841914+00:00"} {"global_step": 236204, "acc_step": 0, "speed/wps": 5526.074734337529, "speed/FLOPS": 244224218243129.75, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047005344182252884, "optim/lr": 9.921588589286268e-06, "optim/total_tokens": 1981422764032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.266891360282898, "created_at": "2025-06-03T08:52:19.815634+00:00"} {"global_step": 236205, "acc_step": 0, "speed/wps": 5519.887514302453, "speed/FLOPS": 243950774786642.44, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.053193747997283936, "optim/lr": 9.91804136419172e-06, "optim/total_tokens": 1981431152640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2727123498916626, "created_at": "2025-06-03T08:52:22.791260+00:00"} {"global_step": 236206, "acc_step": 0, "speed/wps": 5527.401340896325, "speed/FLOPS": 244282847462840.62, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0460277758538723, "optim/lr": 9.914494139097396e-06, "optim/total_tokens": 1981439541248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2671552896499634, "created_at": "2025-06-03T08:52:25.764324+00:00"} {"global_step": 236207, "acc_step": 0, "speed/wps": 5514.567070510879, "speed/FLOPS": 243715638403554.84, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04744986444711685, "optim/lr": 9.91094691400285e-06, "optim/total_tokens": 1981447929856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2694745063781738, "created_at": "2025-06-03T08:52:28.744831+00:00"} {"global_step": 236208, "acc_step": 0, "speed/wps": 5515.121359970303, "speed/FLOPS": 243740135160550.78, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05090968310832977, "optim/lr": 9.907399688908303e-06, "optim/total_tokens": 1981456318464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2706434726715088, "created_at": "2025-06-03T08:52:31.723766+00:00"} {"global_step": 236209, "acc_step": 0, "speed/wps": 5517.049330649622, "speed/FLOPS": 243825341596328.12, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.8, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04968535155057907, "optim/lr": 9.903852463813979e-06, "optim/total_tokens": 1981464707072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2634402513504028, "created_at": "2025-06-03T08:52:34.699811+00:00"} {"global_step": 236210, "acc_step": 0, "speed/wps": 5507.558375698116, "speed/FLOPS": 243405889966582.8, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048285502940416336, "optim/lr": 9.900305238719432e-06, "optim/total_tokens": 1981473095680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2787519693374634, "created_at": "2025-06-03T08:52:37.679145+00:00"} {"global_step": 236211, "acc_step": 0, "speed/wps": 5508.1481367620445, "speed/FLOPS": 243431954386937.7, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05655297264456749, "optim/lr": 9.896758013624884e-06, "optim/total_tokens": 1981481484288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2563143968582153, "created_at": "2025-06-03T08:52:40.662216+00:00"} {"global_step": 236212, "acc_step": 0, "speed/wps": 5515.181751792977, "speed/FLOPS": 243742804169999.56, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.047091610729694366, "optim/lr": 9.893210788530338e-06, "optim/total_tokens": 1981489872896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2599049806594849, "created_at": "2025-06-03T08:52:43.640939+00:00"} {"global_step": 236213, "acc_step": 0, "speed/wps": 5520.03631411745, "speed/FLOPS": 243957350976838.8, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05576860532164574, "optim/lr": 9.889663563436013e-06, "optim/total_tokens": 1981498261504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2655786275863647, "created_at": "2025-06-03T08:52:46.615177+00:00"} {"global_step": 236214, "acc_step": 0, "speed/wps": 5519.990247648442, "speed/FLOPS": 243955315074698.22, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04903838410973549, "optim/lr": 9.886116338341467e-06, "optim/total_tokens": 1981506650112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2668946981430054, "created_at": "2025-06-03T08:52:49.589655+00:00"} {"global_step": 236215, "acc_step": 0, "speed/wps": 5517.324431248343, "speed/FLOPS": 243837499634699.1, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.3 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.3, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04707622900605202, "optim/lr": 9.88256911324692e-06, "optim/total_tokens": 1981515038720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2705641984939575, "created_at": "2025-06-03T08:52:52.563860+00:00"} {"global_step": 236216, "acc_step": 0, "speed/wps": 5528.063662087859, "speed/FLOPS": 244312118669439.25, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.0508972629904747, "optim/lr": 9.879021888152372e-06, "optim/total_tokens": 1981523427328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2491916418075562, "created_at": "2025-06-03T08:52:55.537642+00:00"} {"global_step": 236217, "acc_step": 0, "speed/wps": 5522.084157281903, "speed/FLOPS": 244047855162896.1, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05230909585952759, "optim/lr": 9.875474663058048e-06, "optim/total_tokens": 1981531815936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2741998434066772, "created_at": "2025-06-03T08:52:58.513213+00:00"} {"global_step": 236218, "acc_step": 0, "speed/wps": 5522.3883526739655, "speed/FLOPS": 244061299042212.1, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046262145042419434, "optim/lr": 9.871927437963501e-06, "optim/total_tokens": 1981540204544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2594352960586548, "created_at": "2025-06-03T08:53:01.484451+00:00"} {"global_step": 236219, "acc_step": 0, "speed/wps": 5527.297790985425, "speed/FLOPS": 244278271086795.38, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04991869255900383, "optim/lr": 9.868380212868955e-06, "optim/total_tokens": 1981548593152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2580358982086182, "created_at": "2025-06-03T08:53:04.453324+00:00"} {"global_step": 236220, "acc_step": 0, "speed/wps": 5528.188019944495, "speed/FLOPS": 244317614650181.38, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050048887729644775, "optim/lr": 9.864832987774409e-06, "optim/total_tokens": 1981556981760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2734684944152832, "created_at": "2025-06-03T08:53:07.421768+00:00"} {"global_step": 236221, "acc_step": 0, "speed/wps": 5521.374515817295, "speed/FLOPS": 244016492642434.72, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046269092708826065, "optim/lr": 9.861285762680084e-06, "optim/total_tokens": 1981565370368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2674553394317627, "created_at": "2025-06-03T08:53:10.397113+00:00"} {"global_step": 236222, "acc_step": 0, "speed/wps": 5522.1066757552635, "speed/FLOPS": 244048850364158.62, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04725515469908714, "optim/lr": 9.857738537585536e-06, "optim/total_tokens": 1981573758976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2574268579483032, "created_at": "2025-06-03T08:53:13.368772+00:00"} {"global_step": 236223, "acc_step": 0, "speed/wps": 5530.240610535427, "speed/FLOPS": 244408328648189.5, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.05039503797888756, "optim/lr": 9.85419131249099e-06, "optim/total_tokens": 1981582147584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2766965627670288, "created_at": "2025-06-03T08:53:16.339881+00:00"} {"global_step": 236224, "acc_step": 0, "speed/wps": 5526.88394919379, "speed/FLOPS": 244259981397839.38, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.046504825353622437, "optim/lr": 9.850644087396443e-06, "optim/total_tokens": 1981590536192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2600467205047607, "created_at": "2025-06-03T08:53:19.308507+00:00"} {"global_step": 236225, "acc_step": 0, "speed/wps": 5520.30397306291, "speed/FLOPS": 243969180132225.44, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.045663002878427505, "optim/lr": 9.847096862302119e-06, "optim/total_tokens": 1981598924800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2481193542480469, "created_at": "2025-06-03T08:53:22.281216+00:00"} {"global_step": 236226, "acc_step": 0, "speed/wps": 5515.405103884224, "speed/FLOPS": 243752675189213.06, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.29 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.29, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048882998526096344, "optim/lr": 9.843549637207572e-06, "optim/total_tokens": 1981607313408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2640416622161865, "created_at": "2025-06-03T08:53:25.258166+00:00"} {"global_step": 236227, "acc_step": 0, "speed/wps": 5522.300475252771, "speed/FLOPS": 244057415309992.72, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.04694958031177521, "optim/lr": 9.840002412113024e-06, "optim/total_tokens": 1981615702016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2620147466659546, "created_at": "2025-06-03T08:53:28.230713+00:00"} {"global_step": 236228, "acc_step": 0, "speed/wps": 5521.161528421956, "speed/FLOPS": 244007079689729.03, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048220161348581314, "optim/lr": 9.836455187018478e-06, "optim/total_tokens": 1981624090624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2705432176589966, "created_at": "2025-06-03T08:53:31.207062+00:00"} {"global_step": 236229, "acc_step": 0, "speed/wps": 5522.882106216118, "speed/FLOPS": 244083120421515.5, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.050175316631793976, "optim/lr": 9.832907961924153e-06, "optim/total_tokens": 1981632479232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2806154489517212, "created_at": "2025-06-03T08:53:34.180791+00:00"} {"global_step": 236230, "acc_step": 0, "speed/wps": 5530.442562113056, "speed/FLOPS": 244417253874238.8, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046626124531030655, "optim/lr": 9.829360736829607e-06, "optim/total_tokens": 1981640867840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.269085168838501, "created_at": "2025-06-03T08:53:37.148056+00:00"} {"global_step": 236231, "acc_step": 0, "speed/wps": 5520.961100912264, "speed/FLOPS": 243998221819681.62, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048852041363716125, "optim/lr": 9.82581351173506e-06, "optim/total_tokens": 1981649256448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2677088975906372, "created_at": "2025-06-03T08:53:40.123970+00:00"} {"global_step": 236232, "acc_step": 0, "speed/wps": 5536.524498048159, "speed/FLOPS": 244686044312400.25, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.13, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04678776115179062, "optim/lr": 9.822266286640513e-06, "optim/total_tokens": 1981657645056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2739739418029785, "created_at": "2025-06-03T08:53:43.087677+00:00"} {"global_step": 236233, "acc_step": 0, "speed/wps": 5526.615508136361, "speed/FLOPS": 244248117677106.94, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04889874532818794, "optim/lr": 9.818719061546188e-06, "optim/total_tokens": 1981666033664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2588814496994019, "created_at": "2025-06-03T08:53:46.057159+00:00"} {"global_step": 236234, "acc_step": 0, "speed/wps": 5531.212369713936, "speed/FLOPS": 244451275429965.22, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048828162252902985, "optim/lr": 9.815171836451642e-06, "optim/total_tokens": 1981674422272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2501649856567383, "created_at": "2025-06-03T08:53:49.023982+00:00"} {"global_step": 236235, "acc_step": 0, "speed/wps": 5524.597255073199, "speed/FLOPS": 244158921222070.8, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048515334725379944, "optim/lr": 9.811624611357095e-06, "optim/total_tokens": 1981682810880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2663748264312744, "created_at": "2025-06-03T08:53:51.994146+00:00"} {"global_step": 236236, "acc_step": 0, "speed/wps": 5515.329915439763, "speed/FLOPS": 243749352244817.22, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.1, "optim/grad_norm": 0.048111747950315475, "optim/lr": 9.808077386262771e-06, "optim/total_tokens": 1981691199488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2650668621063232, "created_at": "2025-06-03T08:53:54.969254+00:00"} {"global_step": 236237, "acc_step": 0, "speed/wps": 5523.431703629757, "speed/FLOPS": 244107409814103.78, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04767830669879913, "optim/lr": 9.804530161168223e-06, "optim/total_tokens": 1981699588096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2583509683609009, "created_at": "2025-06-03T08:53:57.940083+00:00"} {"global_step": 236238, "acc_step": 0, "speed/wps": 5522.057531856225, "speed/FLOPS": 244046678455362.4, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04726589098572731, "optim/lr": 9.800982936073676e-06, "optim/total_tokens": 1981707976704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2666360139846802, "created_at": "2025-06-03T08:54:00.913746+00:00"} {"global_step": 236239, "acc_step": 0, "speed/wps": 5533.952635805145, "speed/FLOPS": 244572381165243.34, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047900233417749405, "optim/lr": 9.79743571097913e-06, "optim/total_tokens": 1981716365312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2596129179000854, "created_at": "2025-06-03T08:54:03.878768+00:00"} {"global_step": 236240, "acc_step": 0, "speed/wps": 5532.471760598882, "speed/FLOPS": 244506934060932.94, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.28, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04743048548698425, "optim/lr": 9.793888485884806e-06, "optim/total_tokens": 1981724753920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2630966901779175, "created_at": "2025-06-03T08:54:06.848555+00:00"} {"global_step": 236241, "acc_step": 0, "speed/wps": 5531.405760575041, "speed/FLOPS": 244459822316161.94, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.22, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0468270368874073, "optim/lr": 9.790341260790259e-06, "optim/total_tokens": 1981733142528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.253122329711914, "created_at": "2025-06-03T08:54:09.815457+00:00"} {"global_step": 236242, "acc_step": 0, "speed/wps": 5521.924700631647, "speed/FLOPS": 244040807995127.9, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04840345308184624, "optim/lr": 9.786794035695713e-06, "optim/total_tokens": 1981741531136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2629255056381226, "created_at": "2025-06-03T08:54:12.787246+00:00"} {"global_step": 236243, "acc_step": 0, "speed/wps": 5519.002341914167, "speed/FLOPS": 243911654697803.2, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046219270676374435, "optim/lr": 9.783246810601165e-06, "optim/total_tokens": 1981749919744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2712100744247437, "created_at": "2025-06-03T08:54:15.760354+00:00"} {"global_step": 236244, "acc_step": 0, "speed/wps": 5510.472208607516, "speed/FLOPS": 243534666466829.47, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.28 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.28, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04748465120792389, "optim/lr": 9.77969958550684e-06, "optim/total_tokens": 1981758308352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2606548070907593, "created_at": "2025-06-03T08:54:18.742060+00:00"} {"global_step": 236245, "acc_step": 0, "speed/wps": 5512.206313834803, "speed/FLOPS": 243611305041920.34, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.049259722232818604, "optim/lr": 9.776152360412294e-06, "optim/total_tokens": 1981766696960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2679888010025024, "created_at": "2025-06-03T08:54:21.718838+00:00"} {"global_step": 236246, "acc_step": 0, "speed/wps": 5528.466551464263, "speed/FLOPS": 244329924317701.56, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04731963947415352, "optim/lr": 9.772605135317747e-06, "optim/total_tokens": 1981775085568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2633705139160156, "created_at": "2025-06-03T08:54:24.686938+00:00"} {"global_step": 236247, "acc_step": 0, "speed/wps": 5535.925765933823, "speed/FLOPS": 244659583417535.38, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.16, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04849467799067497, "optim/lr": 9.769057910223201e-06, "optim/total_tokens": 1981783474176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2650374174118042, "created_at": "2025-06-03T08:54:27.652641+00:00"} {"global_step": 236248, "acc_step": 0, "speed/wps": 5520.7399606060335, "speed/FLOPS": 243988448550044.97, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046521734446287155, "optim/lr": 9.765510685128875e-06, "optim/total_tokens": 1981791862784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2828733921051025, "created_at": "2025-06-03T08:54:30.630450+00:00"} {"global_step": 236249, "acc_step": 0, "speed/wps": 5523.7759356641245, "speed/FLOPS": 244122623108083.53, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04789280146360397, "optim/lr": 9.761963460034328e-06, "optim/total_tokens": 1981800251392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2555639743804932, "created_at": "2025-06-03T08:54:33.604397+00:00"} {"global_step": 236250, "acc_step": 0, "speed/wps": 5523.812687234134, "speed/FLOPS": 244124247339366.34, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.27 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.27, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04774148762226105, "optim/lr": 9.758416234939782e-06, "optim/total_tokens": 1981808640000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2503702640533447, "created_at": "2025-06-03T08:54:36.577716+00:00"} {"global_step": 236251, "acc_step": 0, "speed/wps": 5529.473372743777, "speed/FLOPS": 244374420664877.6, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.29, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04633967578411102, "optim/lr": 9.754869009845236e-06, "optim/total_tokens": 1981817028608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.26211416721344, "created_at": "2025-06-03T08:54:39.545093+00:00"} {"global_step": 236252, "acc_step": 0, "speed/wps": 5522.044070390406, "speed/FLOPS": 244046083527475.25, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046717241406440735, "optim/lr": 9.751321784750911e-06, "optim/total_tokens": 1981825417216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2527577877044678, "created_at": "2025-06-03T08:54:42.519919+00:00"} {"global_step": 236253, "acc_step": 0, "speed/wps": 5519.500701764055, "speed/FLOPS": 243933679652331.25, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04716593772172928, "optim/lr": 9.747774559656363e-06, "optim/total_tokens": 1981833805824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.273455023765564, "created_at": "2025-06-03T08:54:45.494503+00:00"} {"global_step": 236254, "acc_step": 0, "speed/wps": 5535.013348049062, "speed/FLOPS": 244619259217207.03, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04693010821938515, "optim/lr": 9.744227334561817e-06, "optim/total_tokens": 1981842194432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2597671747207642, "created_at": "2025-06-03T08:54:48.462205+00:00"} {"global_step": 236255, "acc_step": 0, "speed/wps": 5523.337476399684, "speed/FLOPS": 244103245452833.25, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04620734229683876, "optim/lr": 9.74068010946727e-06, "optim/total_tokens": 1981850583040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2670979499816895, "created_at": "2025-06-03T08:54:51.433133+00:00"} {"global_step": 236256, "acc_step": 0, "speed/wps": 5526.434900631244, "speed/FLOPS": 244240135749813.75, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04657081142067909, "optim/lr": 9.737132884372946e-06, "optim/total_tokens": 1981858971648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2754167318344116, "created_at": "2025-06-03T08:54:54.402098+00:00"} {"global_step": 236257, "acc_step": 0, "speed/wps": 5514.5563534334015, "speed/FLOPS": 243715164763585.3, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04672293737530708, "optim/lr": 9.7335856592784e-06, "optim/total_tokens": 1981867360256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2635506391525269, "created_at": "2025-06-03T08:54:57.379815+00:00"} {"global_step": 236258, "acc_step": 0, "speed/wps": 5532.7831826578795, "speed/FLOPS": 244520697321938.03, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.18, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04756820574402809, "optim/lr": 9.730038434183851e-06, "optim/total_tokens": 1981875748864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2735563516616821, "created_at": "2025-06-03T08:55:00.349423+00:00"} {"global_step": 236259, "acc_step": 0, "speed/wps": 5526.383600743689, "speed/FLOPS": 244237868557360.47, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046068526804447174, "optim/lr": 9.726491209089305e-06, "optim/total_tokens": 1981884137472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2609211206436157, "created_at": "2025-06-03T08:55:03.318558+00:00"} {"global_step": 236260, "acc_step": 0, "speed/wps": 5529.146884185598, "speed/FLOPS": 244359991541726.0, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04643333703279495, "optim/lr": 9.72294398399498e-06, "optim/total_tokens": 1981892526080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2680079936981201, "created_at": "2025-06-03T08:55:06.289650+00:00"} {"global_step": 236261, "acc_step": 0, "speed/wps": 5530.509112654148, "speed/FLOPS": 244420195067518.56, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0474429726600647, "optim/lr": 9.719396758900434e-06, "optim/total_tokens": 1981900914688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.271209955215454, "created_at": "2025-06-03T08:55:09.256956+00:00"} {"global_step": 236262, "acc_step": 0, "speed/wps": 5519.9370776990445, "speed/FLOPS": 243952965235083.3, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.26 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.26, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048680949956178665, "optim/lr": 9.715849533805888e-06, "optim/total_tokens": 1981909303296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2760618925094604, "created_at": "2025-06-03T08:55:12.229420+00:00"} {"global_step": 236263, "acc_step": 0, "speed/wps": 5531.142470676533, "speed/FLOPS": 244448186250287.72, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04724648967385292, "optim/lr": 9.712302308711563e-06, "optim/total_tokens": 1981917691904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2698988914489746, "created_at": "2025-06-03T08:55:15.199921+00:00"} {"global_step": 236264, "acc_step": 0, "speed/wps": 5523.556724645516, "speed/FLOPS": 244112935103084.75, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04660513252019882, "optim/lr": 9.708755083617015e-06, "optim/total_tokens": 1981926080512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2762494087219238, "created_at": "2025-06-03T08:55:18.174788+00:00"} {"global_step": 236265, "acc_step": 0, "speed/wps": 5534.186441088054, "speed/FLOPS": 244582714162024.0, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.12, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05853673443198204, "optim/lr": 9.705207858522469e-06, "optim/total_tokens": 1981934469120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2637139558792114, "created_at": "2025-06-03T08:55:21.143256+00:00"} {"global_step": 236266, "acc_step": 0, "speed/wps": 5526.482081240486, "speed/FLOPS": 244242220891250.0, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048043616116046906, "optim/lr": 9.701660633427922e-06, "optim/total_tokens": 1981942857728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.275107979774475, "created_at": "2025-06-03T08:55:24.112259+00:00"} {"global_step": 236267, "acc_step": 0, "speed/wps": 5531.953000911453, "speed/FLOPS": 244484007538001.38, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04600046947598457, "optim/lr": 9.698113408333598e-06, "optim/total_tokens": 1981951246336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2519344091415405, "created_at": "2025-06-03T08:55:27.078292+00:00"} {"global_step": 236268, "acc_step": 0, "speed/wps": 5514.661655635976, "speed/FLOPS": 243719818581953.6, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04921635612845421, "optim/lr": 9.694566183239051e-06, "optim/total_tokens": 1981959634944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2483434677124023, "created_at": "2025-06-03T08:55:30.057245+00:00"} {"global_step": 236269, "acc_step": 0, "speed/wps": 5516.618448679251, "speed/FLOPS": 243806298818691.6, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046776920557022095, "optim/lr": 9.691018958144503e-06, "optim/total_tokens": 1981968023552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2668635845184326, "created_at": "2025-06-03T08:55:33.031551+00:00"} {"global_step": 236270, "acc_step": 0, "speed/wps": 5523.807906701269, "speed/FLOPS": 244124036064282.72, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04593784734606743, "optim/lr": 9.687471733049957e-06, "optim/total_tokens": 1981976412160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2412019968032837, "created_at": "2025-06-03T08:55:36.002698+00:00"} {"global_step": 236271, "acc_step": 0, "speed/wps": 5531.086962776253, "speed/FLOPS": 244445733085210.56, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.35, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04711433872580528, "optim/lr": 9.683924507955633e-06, "optim/total_tokens": 1981984800768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2750672101974487, "created_at": "2025-06-03T08:55:38.971032+00:00"} {"global_step": 236272, "acc_step": 0, "speed/wps": 5535.781912459571, "speed/FLOPS": 244653225830282.25, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.08, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04745013266801834, "optim/lr": 9.680377282861086e-06, "optim/total_tokens": 1981993189376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2552765607833862, "created_at": "2025-06-03T08:55:41.935367+00:00"} {"global_step": 236273, "acc_step": 0, "speed/wps": 5530.464037832536, "speed/FLOPS": 244418202991117.12, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046596355736255646, "optim/lr": 9.67683005776654e-06, "optim/total_tokens": 1982001577984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2654693126678467, "created_at": "2025-06-03T08:55:44.902191+00:00"} {"global_step": 236274, "acc_step": 0, "speed/wps": 5515.821681193952, "speed/FLOPS": 243771085774067.06, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047302134335041046, "optim/lr": 9.673282832671992e-06, "optim/total_tokens": 1982009966592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2557902336120605, "created_at": "2025-06-03T08:55:47.878634+00:00"} {"global_step": 236275, "acc_step": 0, "speed/wps": 5516.643815049186, "speed/FLOPS": 243807419882405.88, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04711335897445679, "optim/lr": 9.669735607577667e-06, "optim/total_tokens": 1982018355200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2711085081100464, "created_at": "2025-06-03T08:55:50.857884+00:00"} {"global_step": 236276, "acc_step": 0, "speed/wps": 5507.978195716654, "speed/FLOPS": 243424443862568.56, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04672705754637718, "optim/lr": 9.66618838248312e-06, "optim/total_tokens": 1982026743808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2684077024459839, "created_at": "2025-06-03T08:55:53.837294+00:00"} {"global_step": 236277, "acc_step": 0, "speed/wps": 5516.320549576036, "speed/FLOPS": 243793133203115.3, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04601048305630684, "optim/lr": 9.662641157388574e-06, "optim/total_tokens": 1982035132416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.267449140548706, "created_at": "2025-06-03T08:55:56.814361+00:00"} {"global_step": 236278, "acc_step": 0, "speed/wps": 5515.585631870505, "speed/FLOPS": 243760653602180.66, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.8, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0466591902077198, "optim/lr": 9.659093932294028e-06, "optim/total_tokens": 1982043521024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2618519067764282, "created_at": "2025-06-03T08:55:59.793965+00:00"} {"global_step": 236279, "acc_step": 0, "speed/wps": 5514.23425336827, "speed/FLOPS": 243700929589364.12, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.25 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.25, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04686201736330986, "optim/lr": 9.655546707199704e-06, "optim/total_tokens": 1982051909632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2708399295806885, "created_at": "2025-06-03T08:56:02.773132+00:00"} {"global_step": 236280, "acc_step": 0, "speed/wps": 5516.368598529927, "speed/FLOPS": 243795256720940.47, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04625973477959633, "optim/lr": 9.651999482105155e-06, "optim/total_tokens": 1982060298240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2622624635696411, "created_at": "2025-06-03T08:56:05.752020+00:00"} {"global_step": 236281, "acc_step": 0, "speed/wps": 5525.0419528930815, "speed/FLOPS": 244178574589539.84, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04872192069888115, "optim/lr": 9.648452257010609e-06, "optim/total_tokens": 1982068686848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2642145156860352, "created_at": "2025-06-03T08:56:08.728161+00:00"} {"global_step": 236282, "acc_step": 0, "speed/wps": 5523.411932132508, "speed/FLOPS": 244106536015125.06, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04734165221452713, "optim/lr": 9.644905031916063e-06, "optim/total_tokens": 1982077075456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2717121839523315, "created_at": "2025-06-03T08:56:11.699441+00:00"} {"global_step": 236283, "acc_step": 0, "speed/wps": 5512.578386966663, "speed/FLOPS": 243627748769905.62, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04908758029341698, "optim/lr": 9.641357806821738e-06, "optim/total_tokens": 1982085464064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2720173597335815, "created_at": "2025-06-03T08:56:14.676402+00:00"} {"global_step": 236284, "acc_step": 0, "speed/wps": 5522.640518972386, "speed/FLOPS": 244072443501898.2, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04790564253926277, "optim/lr": 9.637810581727192e-06, "optim/total_tokens": 1982093852672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2676371335983276, "created_at": "2025-06-03T08:56:17.648493+00:00"} {"global_step": 236285, "acc_step": 0, "speed/wps": 5514.776677504379, "speed/FLOPS": 243724901959801.72, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04961425065994263, "optim/lr": 9.634263356632644e-06, "optim/total_tokens": 1982102241280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2774863243103027, "created_at": "2025-06-03T08:56:20.626070+00:00"} {"global_step": 236286, "acc_step": 0, "speed/wps": 5516.984544859359, "speed/FLOPS": 243822478396002.25, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04797479137778282, "optim/lr": 9.630716131538097e-06, "optim/total_tokens": 1982110629888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.273710012435913, "created_at": "2025-06-03T08:56:23.604082+00:00"} {"global_step": 236287, "acc_step": 0, "speed/wps": 5509.756904236889, "speed/FLOPS": 243503053674907.4, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.24 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.24, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04721613973379135, "optim/lr": 9.627168906443773e-06, "optim/total_tokens": 1982119018496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2606003284454346, "created_at": "2025-06-03T08:56:26.583408+00:00"} {"global_step": 236288, "acc_step": 0, "speed/wps": 5539.981734045169, "speed/FLOPS": 244838836447730.1, "speed/curr_iter_time": 2.955, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.955, "speed/est_time_elapsed": "8.08 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 193.95, "speed/est_time_elapsed_days": 8.08, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04939146339893341, "optim/lr": 9.623621681349226e-06, "optim/total_tokens": 1982127407104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2652188539505005, "created_at": "2025-06-03T08:56:29.547712+00:00"} {"global_step": 236289, "acc_step": 0, "speed/wps": 5532.971685108872, "speed/FLOPS": 244529028165428.9, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047204602509737015, "optim/lr": 9.62007445625468e-06, "optim/total_tokens": 1982135795712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2584373950958252, "created_at": "2025-06-03T08:56:32.518038+00:00"} {"global_step": 236290, "acc_step": 0, "speed/wps": 5532.938724769786, "speed/FLOPS": 244527571487147.6, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04587191715836525, "optim/lr": 9.616527231160354e-06, "optim/total_tokens": 1982144184320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2546217441558838, "created_at": "2025-06-03T08:56:35.488260+00:00"} {"global_step": 236291, "acc_step": 0, "speed/wps": 5525.383719628086, "speed/FLOPS": 244193678929906.28, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.57, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04924260824918747, "optim/lr": 9.612980006065807e-06, "optim/total_tokens": 1982152572928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.276232123374939, "created_at": "2025-06-03T08:56:38.461252+00:00"} {"global_step": 236292, "acc_step": 0, "speed/wps": 5516.897398154265, "speed/FLOPS": 243818626957694.38, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04697142913937569, "optim/lr": 9.609432780971261e-06, "optim/total_tokens": 1982160961536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.269815444946289, "created_at": "2025-06-03T08:56:41.435405+00:00"} {"global_step": 236293, "acc_step": 0, "speed/wps": 5523.230180071339, "speed/FLOPS": 244098503504312.78, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04593568667769432, "optim/lr": 9.605885555876715e-06, "optim/total_tokens": 1982169350144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2553765773773193, "created_at": "2025-06-03T08:56:44.406143+00:00"} {"global_step": 236294, "acc_step": 0, "speed/wps": 5513.669536574363, "speed/FLOPS": 243675971997555.97, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.049887847155332565, "optim/lr": 9.60233833078239e-06, "optim/total_tokens": 1982177738752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2567025423049927, "created_at": "2025-06-03T08:56:47.382117+00:00"} {"global_step": 236295, "acc_step": 0, "speed/wps": 5514.684053973148, "speed/FLOPS": 243720808473811.53, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04695578292012215, "optim/lr": 9.598791105687842e-06, "optim/total_tokens": 1982186127360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2552546262741089, "created_at": "2025-06-03T08:56:50.357270+00:00"} {"global_step": 236296, "acc_step": 0, "speed/wps": 5534.71679272398, "speed/FLOPS": 244606152989746.16, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04736701771616936, "optim/lr": 9.595243880593296e-06, "optim/total_tokens": 1982194515968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.268046498298645, "created_at": "2025-06-03T08:56:53.326731+00:00"} {"global_step": 236297, "acc_step": 0, "speed/wps": 5519.789484313072, "speed/FLOPS": 243946442362874.72, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.23 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.23, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047309618443250656, "optim/lr": 9.59169665549875e-06, "optim/total_tokens": 1982202904576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2761956453323364, "created_at": "2025-06-03T08:56:56.299142+00:00"} {"global_step": 236298, "acc_step": 0, "speed/wps": 5528.272106571245, "speed/FLOPS": 244321330848689.34, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04680817574262619, "optim/lr": 9.588149430404425e-06, "optim/total_tokens": 1982211293184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.26478910446167, "created_at": "2025-06-03T08:56:59.271258+00:00"} {"global_step": 236299, "acc_step": 0, "speed/wps": 5522.4934055142185, "speed/FLOPS": 244065941840042.1, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04705355688929558, "optim/lr": 9.584602205309878e-06, "optim/total_tokens": 1982219681792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2713209390640259, "created_at": "2025-06-03T08:57:02.243629+00:00"} {"global_step": 236300, "acc_step": 0, "speed/wps": 5523.476010090381, "speed/FLOPS": 244109367932882.34, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04951326176524162, "optim/lr": 9.581054980215332e-06, "optim/total_tokens": 1982228070400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2741317749023438, "created_at": "2025-06-03T08:57:05.214295+00:00"} {"global_step": 236301, "acc_step": 0, "speed/wps": 5532.761707629042, "speed/FLOPS": 244519748235582.56, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.32, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047131091356277466, "optim/lr": 9.577507755120784e-06, "optim/total_tokens": 1982236459008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2522777318954468, "created_at": "2025-06-03T08:57:08.181803+00:00"} {"global_step": 236302, "acc_step": 0, "speed/wps": 5519.10828581078, "speed/FLOPS": 243916336875763.47, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.051867228001356125, "optim/lr": 9.57396053002646e-06, "optim/total_tokens": 1982244847616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2552624940872192, "created_at": "2025-06-03T08:57:11.155338+00:00"} {"global_step": 236303, "acc_step": 0, "speed/wps": 5522.466414255014, "speed/FLOPS": 244064748964539.03, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04706186801195145, "optim/lr": 9.570413304931913e-06, "optim/total_tokens": 1982253236224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.260219693183899, "created_at": "2025-06-03T08:57:14.127284+00:00"} {"global_step": 236304, "acc_step": 0, "speed/wps": 5528.735987276127, "speed/FLOPS": 244341832001488.44, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04728235676884651, "optim/lr": 9.566866079837367e-06, "optim/total_tokens": 1982261624832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2621949911117554, "created_at": "2025-06-03T08:57:17.095259+00:00"} {"global_step": 236305, "acc_step": 0, "speed/wps": 5537.02074135829, "speed/FLOPS": 244707975726704.53, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 194.07, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04987102374434471, "optim/lr": 9.56331885474282e-06, "optim/total_tokens": 1982270013440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2777410745620728, "created_at": "2025-06-03T08:57:20.061329+00:00"} {"global_step": 236306, "acc_step": 0, "speed/wps": 5531.873854649887, "speed/FLOPS": 244480509678347.44, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04656529799103737, "optim/lr": 9.559771629648494e-06, "optim/total_tokens": 1982278402048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2711936235427856, "created_at": "2025-06-03T08:57:23.032375+00:00"} {"global_step": 236307, "acc_step": 0, "speed/wps": 5533.26996133957, "speed/FLOPS": 244542210448109.6, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 194.31, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05173473060131073, "optim/lr": 9.556224404553948e-06, "optim/total_tokens": 1982286790656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2565603256225586, "created_at": "2025-06-03T08:57:26.001128+00:00"} {"global_step": 236308, "acc_step": 0, "speed/wps": 5514.384773504948, "speed/FLOPS": 243707581808973.34, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04936552047729492, "optim/lr": 9.552677179459401e-06, "optim/total_tokens": 1982295179264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2720953226089478, "created_at": "2025-06-03T08:57:28.979168+00:00"} {"global_step": 236309, "acc_step": 0, "speed/wps": 5515.064046991537, "speed/FLOPS": 243737602220243.72, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047395311295986176, "optim/lr": 9.549129954364855e-06, "optim/total_tokens": 1982303567872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2770236730575562, "created_at": "2025-06-03T08:57:31.955347+00:00"} {"global_step": 236310, "acc_step": 0, "speed/wps": 5516.159713272348, "speed/FLOPS": 243786025061727.16, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0541912280023098, "optim/lr": 9.54558272927053e-06, "optim/total_tokens": 1982311956480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.267864465713501, "created_at": "2025-06-03T08:57:34.930589+00:00"} {"global_step": 236311, "acc_step": 0, "speed/wps": 5525.618802073085, "speed/FLOPS": 244204068370714.22, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 194.58, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04664747416973114, "optim/lr": 9.542035504175982e-06, "optim/total_tokens": 1982320345088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2785429954528809, "created_at": "2025-06-03T08:57:37.900682+00:00"} {"global_step": 236312, "acc_step": 0, "speed/wps": 5511.098564470352, "speed/FLOPS": 243562348189986.88, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0478353314101696, "optim/lr": 9.538488279081436e-06, "optim/total_tokens": 1982328733696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2597156763076782, "created_at": "2025-06-03T08:57:40.879697+00:00"} {"global_step": 236313, "acc_step": 0, "speed/wps": 5526.663096804061, "speed/FLOPS": 244250220852638.38, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04947764426469803, "optim/lr": 9.53494105398689e-06, "optim/total_tokens": 1982337122304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2768577337265015, "created_at": "2025-06-03T08:57:43.855420+00:00"} {"global_step": 236314, "acc_step": 0, "speed/wps": 5526.467852537709, "speed/FLOPS": 244241592055416.38, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04686186462640762, "optim/lr": 9.531393828892565e-06, "optim/total_tokens": 1982345510912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2582565546035767, "created_at": "2025-06-03T08:57:46.830536+00:00"} {"global_step": 236315, "acc_step": 0, "speed/wps": 5505.0351856194075, "speed/FLOPS": 243294377879961.47, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04776721075177193, "optim/lr": 9.527846603798019e-06, "optim/total_tokens": 1982353899520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2679588794708252, "created_at": "2025-06-03T08:57:49.812060+00:00"} {"global_step": 236316, "acc_step": 0, "speed/wps": 5521.014217818593, "speed/FLOPS": 244000569315064.44, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04803679883480072, "optim/lr": 9.52429937870347e-06, "optim/total_tokens": 1982362288128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2819621562957764, "created_at": "2025-06-03T08:57:52.788465+00:00"} {"global_step": 236317, "acc_step": 0, "speed/wps": 5512.72357813326, "speed/FLOPS": 243634165476313.47, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047176796942949295, "optim/lr": 9.520752153608924e-06, "optim/total_tokens": 1982370676736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2579621076583862, "created_at": "2025-06-03T08:57:55.766936+00:00"} {"global_step": 236318, "acc_step": 0, "speed/wps": 5504.664766456219, "speed/FLOPS": 243278007248925.7, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04990227892994881, "optim/lr": 9.5172049285146e-06, "optim/total_tokens": 1982379065344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2656811475753784, "created_at": "2025-06-03T08:57:58.749910+00:00"} {"global_step": 236319, "acc_step": 0, "speed/wps": 5503.11053622003, "speed/FLOPS": 243209318227757.66, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.22 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.22, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047029271721839905, "optim/lr": 9.513657703420053e-06, "optim/total_tokens": 1982387453952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2609835863113403, "created_at": "2025-06-03T08:58:01.731924+00:00"} {"global_step": 236320, "acc_step": 0, "speed/wps": 5508.025039292482, "speed/FLOPS": 243426514108852.97, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047924723476171494, "optim/lr": 9.510110478325507e-06, "optim/total_tokens": 1982395842560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2605347633361816, "created_at": "2025-06-03T08:58:04.710970+00:00"} {"global_step": 236321, "acc_step": 0, "speed/wps": 5515.176286368286, "speed/FLOPS": 243742562626202.8, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04686029627919197, "optim/lr": 9.506563253231183e-06, "optim/total_tokens": 1982404231168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.258916974067688, "created_at": "2025-06-03T08:58:07.689891+00:00"} {"global_step": 236322, "acc_step": 0, "speed/wps": 5506.710860640153, "speed/FLOPS": 243368434138996.2, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04700969532132149, "optim/lr": 9.503016028136634e-06, "optim/total_tokens": 1982412619776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.265051245689392, "created_at": "2025-06-03T08:58:10.669960+00:00"} {"global_step": 236323, "acc_step": 0, "speed/wps": 5513.963577105476, "speed/FLOPS": 243688967083995.34, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046816226094961166, "optim/lr": 9.499468803042088e-06, "optim/total_tokens": 1982421008384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2758864164352417, "created_at": "2025-06-03T08:58:13.650111+00:00"} {"global_step": 236324, "acc_step": 0, "speed/wps": 5526.796586266366, "speed/FLOPS": 244256120403611.25, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04712168872356415, "optim/lr": 9.495921577947542e-06, "optim/total_tokens": 1982429396992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2653095722198486, "created_at": "2025-06-03T08:58:16.619444+00:00"} {"global_step": 236325, "acc_step": 0, "speed/wps": 5505.535155650095, "speed/FLOPS": 243316473996239.25, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046208519488573074, "optim/lr": 9.492374352853217e-06, "optim/total_tokens": 1982437785600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.265655755996704, "created_at": "2025-06-03T08:58:19.599625+00:00"} {"global_step": 236326, "acc_step": 0, "speed/wps": 5507.8867540305755, "speed/FLOPS": 243420402608084.84, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04654854163527489, "optim/lr": 9.48882712775867e-06, "optim/total_tokens": 1982446174208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2662222385406494, "created_at": "2025-06-03T08:58:22.579317+00:00"} {"global_step": 236327, "acc_step": 0, "speed/wps": 5506.4068210718215, "speed/FLOPS": 243354997146291.5, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04648350551724434, "optim/lr": 9.485279902664123e-06, "optim/total_tokens": 1982454562816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2762984037399292, "created_at": "2025-06-03T08:58:25.559913+00:00"} {"global_step": 236328, "acc_step": 0, "speed/wps": 5511.799531245535, "speed/FLOPS": 243593327333576.75, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.045913610607385635, "optim/lr": 9.481732677569576e-06, "optim/total_tokens": 1982462951424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.278335452079773, "created_at": "2025-06-03T08:58:28.541151+00:00"} {"global_step": 236329, "acc_step": 0, "speed/wps": 5502.6165192801645, "speed/FLOPS": 243187485207623.53, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.21 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.21, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04729744791984558, "optim/lr": 9.478185452475252e-06, "optim/total_tokens": 1982471340032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2681256532669067, "created_at": "2025-06-03T08:58:31.523728+00:00"} {"global_step": 236330, "acc_step": 0, "speed/wps": 5509.408837259647, "speed/FLOPS": 243487670896081.6, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047473110258579254, "optim/lr": 9.474638227380705e-06, "optim/total_tokens": 1982479728640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2436436414718628, "created_at": "2025-06-03T08:58:34.502151+00:00"} {"global_step": 236331, "acc_step": 0, "speed/wps": 5511.389844474961, "speed/FLOPS": 243575221275284.38, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046677928417921066, "optim/lr": 9.471091002286159e-06, "optim/total_tokens": 1982488117248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.251661777496338, "created_at": "2025-06-03T08:58:37.483184+00:00"} {"global_step": 236332, "acc_step": 0, "speed/wps": 5520.8379459603475, "speed/FLOPS": 243992779001171.12, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04774762690067291, "optim/lr": 9.467543777191611e-06, "optim/total_tokens": 1982496505856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.267103672027588, "created_at": "2025-06-03T08:58:40.455691+00:00"} {"global_step": 236333, "acc_step": 0, "speed/wps": 5518.63366720063, "speed/FLOPS": 243895361162513.1, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04675142467021942, "optim/lr": 9.463996552097287e-06, "optim/total_tokens": 1982504894464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2620570659637451, "created_at": "2025-06-03T08:58:43.431679+00:00"} {"global_step": 236334, "acc_step": 0, "speed/wps": 5525.174554105647, "speed/FLOPS": 244184434884420.7, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04691484570503235, "optim/lr": 9.46044932700274e-06, "optim/total_tokens": 1982513283072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2789324522018433, "created_at": "2025-06-03T08:58:46.405592+00:00"} {"global_step": 236335, "acc_step": 0, "speed/wps": 5526.786688885619, "speed/FLOPS": 244255682990041.62, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.051859259605407715, "optim/lr": 9.456902101908194e-06, "optim/total_tokens": 1982521671680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2818281650543213, "created_at": "2025-06-03T08:58:49.376013+00:00"} {"global_step": 236336, "acc_step": 0, "speed/wps": 5511.446296769982, "speed/FLOPS": 243577716177775.25, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04670105129480362, "optim/lr": 9.453354876813647e-06, "optim/total_tokens": 1982530060288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2521153688430786, "created_at": "2025-06-03T08:58:52.356774+00:00"} {"global_step": 236337, "acc_step": 0, "speed/wps": 5519.088762985628, "speed/FLOPS": 243915474066818.6, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.2 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.2, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04684309661388397, "optim/lr": 9.449807651719323e-06, "optim/total_tokens": 1982538448896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2673009634017944, "created_at": "2025-06-03T08:58:55.330240+00:00"} {"global_step": 236338, "acc_step": 0, "speed/wps": 5524.47094089521, "speed/FLOPS": 244153338781938.28, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05017952620983124, "optim/lr": 9.446260426624775e-06, "optim/total_tokens": 1982546837504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2700984477996826, "created_at": "2025-06-03T08:58:58.302461+00:00"} {"global_step": 236339, "acc_step": 0, "speed/wps": 5527.442395673765, "speed/FLOPS": 244284661873866.06, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04858936741948128, "optim/lr": 9.442713201530228e-06, "optim/total_tokens": 1982555226112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2772279977798462, "created_at": "2025-06-03T08:59:01.274445+00:00"} {"global_step": 236340, "acc_step": 0, "speed/wps": 5539.534744131837, "speed/FLOPS": 244819081781462.62, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04853852838277817, "optim/lr": 9.439165976435682e-06, "optim/total_tokens": 1982563614720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2540210485458374, "created_at": "2025-06-03T08:59:04.238966+00:00"} {"global_step": 236341, "acc_step": 0, "speed/wps": 5525.028816104109, "speed/FLOPS": 244177994010707.44, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0466887541115284, "optim/lr": 9.435618751341358e-06, "optim/total_tokens": 1982572003328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.278153419494629, "created_at": "2025-06-03T08:59:07.210971+00:00"} {"global_step": 236342, "acc_step": 0, "speed/wps": 5532.699373741458, "speed/FLOPS": 244516993396805.12, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.25, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.056180231273174286, "optim/lr": 9.432071526246811e-06, "optim/total_tokens": 1982580391936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2762686014175415, "created_at": "2025-06-03T08:59:10.181426+00:00"} {"global_step": 236343, "acc_step": 0, "speed/wps": 5518.098204541225, "speed/FLOPS": 243871696453713.72, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05308045074343681, "optim/lr": 9.428524301152263e-06, "optim/total_tokens": 1982588780544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2713220119476318, "created_at": "2025-06-03T08:59:13.155132+00:00"} {"global_step": 236344, "acc_step": 0, "speed/wps": 5513.737918499726, "speed/FLOPS": 243678994128646.62, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046224843710660934, "optim/lr": 9.424977076057717e-06, "optim/total_tokens": 1982597169152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.239024043083191, "created_at": "2025-06-03T08:59:16.135050+00:00"} {"global_step": 236345, "acc_step": 0, "speed/wps": 5512.7777709587435, "speed/FLOPS": 243636560521815.8, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04688796028494835, "optim/lr": 9.421429850963392e-06, "optim/total_tokens": 1982605557760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2644309997558594, "created_at": "2025-06-03T08:59:19.113048+00:00"} {"global_step": 236346, "acc_step": 0, "speed/wps": 5505.407309910325, "speed/FLOPS": 243310823868915.25, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05294283851981163, "optim/lr": 9.417882625868846e-06, "optim/total_tokens": 1982613946368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.264866828918457, "created_at": "2025-06-03T08:59:22.098897+00:00"} {"global_step": 236347, "acc_step": 0, "speed/wps": 5502.729741859644, "speed/FLOPS": 243192489066110.8, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04700198024511337, "optim/lr": 9.4143354007743e-06, "optim/total_tokens": 1982622334976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2716060876846313, "created_at": "2025-06-03T08:59:25.084639+00:00"} {"global_step": 236348, "acc_step": 0, "speed/wps": 5510.374846301434, "speed/FLOPS": 243530363551246.1, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04760972410440445, "optim/lr": 9.410788175679973e-06, "optim/total_tokens": 1982630723584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2586840391159058, "created_at": "2025-06-03T08:59:28.067469+00:00"} {"global_step": 236349, "acc_step": 0, "speed/wps": 5521.890686681074, "speed/FLOPS": 244039304752611.75, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05254543945193291, "optim/lr": 9.407240950585427e-06, "optim/total_tokens": 1982639112192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.246264100074768, "created_at": "2025-06-03T08:59:31.042173+00:00"} {"global_step": 236350, "acc_step": 0, "speed/wps": 5522.814694484366, "speed/FLOPS": 244080141168016.56, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046453434973955154, "optim/lr": 9.40369372549088e-06, "optim/total_tokens": 1982647500800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2620254755020142, "created_at": "2025-06-03T08:59:34.014429+00:00"} {"global_step": 236351, "acc_step": 0, "speed/wps": 5516.608338611282, "speed/FLOPS": 243805852005435.4, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05462366342544556, "optim/lr": 9.400146500396334e-06, "optim/total_tokens": 1982655889408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.261625051498413, "created_at": "2025-06-03T08:59:36.993437+00:00"} {"global_step": 236352, "acc_step": 0, "speed/wps": 5517.335574808958, "speed/FLOPS": 243837992123040.38, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04853062704205513, "optim/lr": 9.39659927530201e-06, "optim/total_tokens": 1982664278016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2735813856124878, "created_at": "2025-06-03T08:59:39.967807+00:00"} {"global_step": 236353, "acc_step": 0, "speed/wps": 5517.7495692193215, "speed/FLOPS": 243856288556962.94, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0463678278028965, "optim/lr": 9.393052050207463e-06, "optim/total_tokens": 1982672666624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2674758434295654, "created_at": "2025-06-03T08:59:42.942272+00:00"} {"global_step": 236354, "acc_step": 0, "speed/wps": 5506.180187283928, "speed/FLOPS": 243344981092883.47, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.19 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.19, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.054006725549697876, "optim/lr": 9.389504825112915e-06, "optim/total_tokens": 1982681055232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.250357747077942, "created_at": "2025-06-03T08:59:45.924195+00:00"} {"global_step": 236355, "acc_step": 0, "speed/wps": 5509.995330904172, "speed/FLOPS": 243513590913223.0, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05268045887351036, "optim/lr": 9.385957600018369e-06, "optim/total_tokens": 1982689443840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2592500448226929, "created_at": "2025-06-03T08:59:48.904772+00:00"} {"global_step": 236356, "acc_step": 0, "speed/wps": 5522.796698043964, "speed/FLOPS": 244079345817464.97, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.052337657660245895, "optim/lr": 9.382410374924044e-06, "optim/total_tokens": 1982697832448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.266648769378662, "created_at": "2025-06-03T08:59:51.876456+00:00"} {"global_step": 236357, "acc_step": 0, "speed/wps": 5526.886768182888, "speed/FLOPS": 244260105982728.62, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.57, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05037786439061165, "optim/lr": 9.378863149829498e-06, "optim/total_tokens": 1982706221056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2701570987701416, "created_at": "2025-06-03T08:59:54.846595+00:00"} {"global_step": 236358, "acc_step": 0, "speed/wps": 5527.6736351015425, "speed/FLOPS": 244294881472983.16, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04824243113398552, "optim/lr": 9.375315924734951e-06, "optim/total_tokens": 1982714609664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.266341209411621, "created_at": "2025-06-03T08:59:57.818657+00:00"} {"global_step": 236359, "acc_step": 0, "speed/wps": 5516.507758059949, "speed/FLOPS": 243801406859884.4, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04943389818072319, "optim/lr": 9.371768699640403e-06, "optim/total_tokens": 1982722998272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2791836261749268, "created_at": "2025-06-03T09:00:00.793526+00:00"} {"global_step": 236360, "acc_step": 0, "speed/wps": 5513.766429074583, "speed/FLOPS": 243680254150124.97, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05262910574674606, "optim/lr": 9.368221474546079e-06, "optim/total_tokens": 1982731386880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2655330896377563, "created_at": "2025-06-03T09:00:03.769741+00:00"} {"global_step": 236361, "acc_step": 0, "speed/wps": 5501.971976832301, "speed/FLOPS": 243158999730495.28, "speed/curr_iter_time": 2.977, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.977, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0505581796169281, "optim/lr": 9.364674249451532e-06, "optim/total_tokens": 1982739775488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2641700506210327, "created_at": "2025-06-03T09:00:06.752061+00:00"} {"global_step": 236362, "acc_step": 0, "speed/wps": 5501.713186554527, "speed/FLOPS": 243147562524826.4, "speed/curr_iter_time": 2.9772, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9772, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.049961745738983154, "optim/lr": 9.361127024356986e-06, "optim/total_tokens": 1982748164096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2863904237747192, "created_at": "2025-06-03T09:00:09.740338+00:00"} {"global_step": 236363, "acc_step": 0, "speed/wps": 5510.219803050757, "speed/FLOPS": 243523511433149.47, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05645406246185303, "optim/lr": 9.35757979926244e-06, "optim/total_tokens": 1982756552704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.260937213897705, "created_at": "2025-06-03T09:00:12.724716+00:00"} {"global_step": 236364, "acc_step": 0, "speed/wps": 5518.573435625748, "speed/FLOPS": 243892699235196.47, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04789154976606369, "optim/lr": 9.354032574168114e-06, "optim/total_tokens": 1982764941312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2737550735473633, "created_at": "2025-06-03T09:00:15.698417+00:00"} {"global_step": 236365, "acc_step": 0, "speed/wps": 5504.930330396577, "speed/FLOPS": 243289743815810.06, "speed/curr_iter_time": 2.9754, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9754, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05058024078607559, "optim/lr": 9.350485349073567e-06, "optim/total_tokens": 1982773329920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2608784437179565, "created_at": "2025-06-03T09:00:18.679465+00:00"} {"global_step": 236366, "acc_step": 0, "speed/wps": 5501.312421435052, "speed/FLOPS": 243129850757847.44, "speed/curr_iter_time": 2.9755, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9755, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.18 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.18, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05427122861146927, "optim/lr": 9.34693812397902e-06, "optim/total_tokens": 1982781718528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.254820466041565, "created_at": "2025-06-03T09:00:21.666851+00:00"} {"global_step": 236367, "acc_step": 0, "speed/wps": 5510.030309011419, "speed/FLOPS": 243515136766529.16, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047716300934553146, "optim/lr": 9.343390898884474e-06, "optim/total_tokens": 1982790107136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2565125226974487, "created_at": "2025-06-03T09:00:24.645713+00:00"} {"global_step": 236368, "acc_step": 0, "speed/wps": 5516.964564728436, "speed/FLOPS": 243821595376483.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05018042400479317, "optim/lr": 9.33984367379015e-06, "optim/total_tokens": 1982798495744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.262884497642517, "created_at": "2025-06-03T09:00:27.620301+00:00"} {"global_step": 236369, "acc_step": 0, "speed/wps": 5518.803046717334, "speed/FLOPS": 243902846870188.44, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.055910032242536545, "optim/lr": 9.336296448695602e-06, "optim/total_tokens": 1982806884352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.26265549659729, "created_at": "2025-06-03T09:00:30.593409+00:00"} {"global_step": 236370, "acc_step": 0, "speed/wps": 5502.8102983187655, "speed/FLOPS": 243196049249278.66, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04745727404952049, "optim/lr": 9.332749223601055e-06, "optim/total_tokens": 1982815272960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.257345199584961, "created_at": "2025-06-03T09:00:33.575407+00:00"} {"global_step": 236371, "acc_step": 0, "speed/wps": 5519.688501542433, "speed/FLOPS": 243941979441289.2, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05853800103068352, "optim/lr": 9.329201998506509e-06, "optim/total_tokens": 1982823661568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2782992124557495, "created_at": "2025-06-03T09:00:36.548767+00:00"} {"global_step": 236372, "acc_step": 0, "speed/wps": 5519.396413855787, "speed/FLOPS": 243929070660579.72, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05619882419705391, "optim/lr": 9.325654773412185e-06, "optim/total_tokens": 1982832050176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2494711875915527, "created_at": "2025-06-03T09:00:39.521562+00:00"} {"global_step": 236373, "acc_step": 0, "speed/wps": 5524.964867386984, "speed/FLOPS": 244175167804729.72, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046242568641901016, "optim/lr": 9.322107548317638e-06, "optim/total_tokens": 1982840438784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2556203603744507, "created_at": "2025-06-03T09:00:42.495061+00:00"} {"global_step": 236374, "acc_step": 0, "speed/wps": 5515.311241090887, "speed/FLOPS": 243748526934180.88, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.051629699766635895, "optim/lr": 9.31856032322309e-06, "optim/total_tokens": 1982848827392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2474802732467651, "created_at": "2025-06-03T09:00:45.473371+00:00"} {"global_step": 236375, "acc_step": 0, "speed/wps": 5519.68184606538, "speed/FLOPS": 243941685303269.28, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05273403972387314, "optim/lr": 9.315013098128766e-06, "optim/total_tokens": 1982857216000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.272246241569519, "created_at": "2025-06-03T09:00:48.448789+00:00"} {"global_step": 236376, "acc_step": 0, "speed/wps": 5504.179085370799, "speed/FLOPS": 243256542630891.28, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04695820063352585, "optim/lr": 9.31146587303422e-06, "optim/total_tokens": 1982865604608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2675143480300903, "created_at": "2025-06-03T09:00:51.432402+00:00"} {"global_step": 236377, "acc_step": 0, "speed/wps": 5521.638484001072, "speed/FLOPS": 244028158685046.03, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.049373745918273926, "optim/lr": 9.307918647939673e-06, "optim/total_tokens": 1982873993216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2588026523590088, "created_at": "2025-06-03T09:00:54.408788+00:00"} {"global_step": 236378, "acc_step": 0, "speed/wps": 5497.412702679524, "speed/FLOPS": 242957503149423.16, "speed/curr_iter_time": 2.9794, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9794, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.17 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.17, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05471258610486984, "optim/lr": 9.304371422845126e-06, "optim/total_tokens": 1982882381824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2831707000732422, "created_at": "2025-06-03T09:00:57.393996+00:00"} {"global_step": 236379, "acc_step": 0, "speed/wps": 5506.485071796856, "speed/FLOPS": 243358455427814.5, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.08057855069637299, "optim/lr": 9.300824197750802e-06, "optim/total_tokens": 1982890770432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.260487675666809, "created_at": "2025-06-03T09:01:00.373734+00:00"} {"global_step": 236380, "acc_step": 0, "speed/wps": 5529.472827883389, "speed/FLOPS": 244374396584837.3, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04996153339743614, "optim/lr": 9.297276972656254e-06, "optim/total_tokens": 1982899159040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2647521495819092, "created_at": "2025-06-03T09:01:03.344449+00:00"} {"global_step": 236381, "acc_step": 0, "speed/wps": 5519.385581459466, "speed/FLOPS": 243928591924107.6, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.053188078105449677, "optim/lr": 9.293729747561707e-06, "optim/total_tokens": 1982907547648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.266021966934204, "created_at": "2025-06-03T09:01:06.322890+00:00"} {"global_step": 236382, "acc_step": 0, "speed/wps": 5507.547009513359, "speed/FLOPS": 243405387639393.97, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04798628017306328, "optim/lr": 9.290182522467161e-06, "optim/total_tokens": 1982915936256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.264456033706665, "created_at": "2025-06-03T09:01:09.304218+00:00"} {"global_step": 236383, "acc_step": 0, "speed/wps": 5521.329373593616, "speed/FLOPS": 244014497587206.94, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04909289628267288, "optim/lr": 9.286635297372837e-06, "optim/total_tokens": 1982924324864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2559764385223389, "created_at": "2025-06-03T09:01:12.280917+00:00"} {"global_step": 236384, "acc_step": 0, "speed/wps": 5521.308294103254, "speed/FLOPS": 244013565981627.56, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05165183171629906, "optim/lr": 9.28308807227829e-06, "optim/total_tokens": 1982932713472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2444487810134888, "created_at": "2025-06-03T09:01:15.253098+00:00"} {"global_step": 236385, "acc_step": 0, "speed/wps": 5517.939791887308, "speed/FLOPS": 243864695425240.1, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04878005385398865, "optim/lr": 9.279540847183742e-06, "optim/total_tokens": 1982941102080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2663495540618896, "created_at": "2025-06-03T09:01:18.227279+00:00"} {"global_step": 236386, "acc_step": 0, "speed/wps": 5509.922137269178, "speed/FLOPS": 243510356129195.25, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04625382646918297, "optim/lr": 9.275993622089196e-06, "optim/total_tokens": 1982949490688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2582039833068848, "created_at": "2025-06-03T09:01:21.210482+00:00"} {"global_step": 236387, "acc_step": 0, "speed/wps": 5499.621943337459, "speed/FLOPS": 243055140278585.1, "speed/curr_iter_time": 2.9783, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9783, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 195.56, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05240932106971741, "optim/lr": 9.272446396994871e-06, "optim/total_tokens": 1982957879296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2574275732040405, "created_at": "2025-06-03T09:01:24.195058+00:00"} {"global_step": 236388, "acc_step": 0, "speed/wps": 5511.846996777202, "speed/FLOPS": 243595425067125.8, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.16 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.16, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04914556443691254, "optim/lr": 9.268899171900325e-06, "optim/total_tokens": 1982966267904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2405202388763428, "created_at": "2025-06-03T09:01:27.173889+00:00"} {"global_step": 236389, "acc_step": 0, "speed/wps": 5524.3158354735215, "speed/FLOPS": 244146483916201.16, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04830719903111458, "optim/lr": 9.265351946805778e-06, "optim/total_tokens": 1982974656512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2593632936477661, "created_at": "2025-06-03T09:01:30.146411+00:00"} {"global_step": 236390, "acc_step": 0, "speed/wps": 5526.329276799102, "speed/FLOPS": 244235467717064.88, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0575370192527771, "optim/lr": 9.26180472171123e-06, "optim/total_tokens": 1982983045120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2610836029052734, "created_at": "2025-06-03T09:01:33.119954+00:00"} {"global_step": 236391, "acc_step": 0, "speed/wps": 5527.301313730421, "speed/FLOPS": 244278426774093.1, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048284001648426056, "optim/lr": 9.258257496616906e-06, "optim/total_tokens": 1982991433728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2614531517028809, "created_at": "2025-06-03T09:01:36.091717+00:00"} {"global_step": 236392, "acc_step": 0, "speed/wps": 5517.529450118799, "speed/FLOPS": 243846560419391.56, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04793717339634895, "optim/lr": 9.25471027152236e-06, "optim/total_tokens": 1982999822336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2551811933517456, "created_at": "2025-06-03T09:01:39.065687+00:00"} {"global_step": 236393, "acc_step": 0, "speed/wps": 5523.515455291759, "speed/FLOPS": 244111111208884.4, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0490015484392643, "optim/lr": 9.251163046427813e-06, "optim/total_tokens": 1983008210944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 425, "loss/out": 1.2670178413391113, "created_at": "2025-06-03T09:01:42.036207+00:00"} {"global_step": 236394, "acc_step": 0, "speed/wps": 5513.905112134093, "speed/FLOPS": 243686383231511.03, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04805051162838936, "optim/lr": 9.247615821333267e-06, "optim/total_tokens": 1983016599552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.258194923400879, "created_at": "2025-06-03T09:01:45.012556+00:00"} {"global_step": 236395, "acc_step": 0, "speed/wps": 5515.363514888784, "speed/FLOPS": 243750837168486.4, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 195.01, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04542740434408188, "optim/lr": 9.244068596238942e-06, "optim/total_tokens": 1983024988160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.269494891166687, "created_at": "2025-06-03T09:01:47.988275+00:00"} {"global_step": 236396, "acc_step": 0, "speed/wps": 5504.858093782333, "speed/FLOPS": 243286551327200.97, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046882156282663345, "optim/lr": 9.240521371144394e-06, "optim/total_tokens": 1983033376768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2773222923278809, "created_at": "2025-06-03T09:01:50.969672+00:00"} {"global_step": 236397, "acc_step": 0, "speed/wps": 5521.272586962723, "speed/FLOPS": 244011987908781.8, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 194.8, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04933565855026245, "optim/lr": 9.236974146049848e-06, "optim/total_tokens": 1983041765376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2596684694290161, "created_at": "2025-06-03T09:01:53.941925+00:00"} {"global_step": 236398, "acc_step": 0, "speed/wps": 5529.543724072513, "speed/FLOPS": 244377529833517.0, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047240812331438065, "optim/lr": 9.233426920955301e-06, "optim/total_tokens": 1983050153984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2819370031356812, "created_at": "2025-06-03T09:01:56.910639+00:00"} {"global_step": 236399, "acc_step": 0, "speed/wps": 5525.379718615751, "speed/FLOPS": 244193502105640.12, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047354113310575485, "optim/lr": 9.229879695860977e-06, "optim/total_tokens": 1983058542592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2643227577209473, "created_at": "2025-06-03T09:01:59.881139+00:00"} {"global_step": 236400, "acc_step": 0, "speed/wps": 5525.249860233712, "speed/FLOPS": 244187763029829.44, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046747349202632904, "optim/lr": 9.22633247076643e-06, "optim/total_tokens": 1983066931200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2497966289520264, "created_at": "2025-06-03T09:02:02.852652+00:00"} {"global_step": 236401, "acc_step": 0, "speed/wps": 5522.24960355061, "speed/FLOPS": 244055167041142.2, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04798813909292221, "optim/lr": 9.222785245671882e-06, "optim/total_tokens": 1983075319808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2651900053024292, "created_at": "2025-06-03T09:02:05.824058+00:00"} {"global_step": 236402, "acc_step": 0, "speed/wps": 5501.7667837234685, "speed/FLOPS": 243149931245358.44, "speed/curr_iter_time": 2.9771, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9771, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.15 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.15, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04651929438114166, "optim/lr": 9.219238020577558e-06, "optim/total_tokens": 1983083708416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.256544589996338, "created_at": "2025-06-03T09:02:08.806352+00:00"} {"global_step": 236403, "acc_step": 0, "speed/wps": 5523.862864466464, "speed/FLOPS": 244126464916205.0, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047620274126529694, "optim/lr": 9.215690795483012e-06, "optim/total_tokens": 1983092097024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2732230424880981, "created_at": "2025-06-03T09:02:11.781454+00:00"} {"global_step": 236404, "acc_step": 0, "speed/wps": 5518.050131510001, "speed/FLOPS": 243869571871793.72, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04706050828099251, "optim/lr": 9.212143570388465e-06, "optim/total_tokens": 1983100485632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2789380550384521, "created_at": "2025-06-03T09:02:14.754910+00:00"} {"global_step": 236405, "acc_step": 0, "speed/wps": 5515.284016537542, "speed/FLOPS": 243747323748270.94, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04667140543460846, "optim/lr": 9.208596345293919e-06, "optim/total_tokens": 1983108874240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.25359308719635, "created_at": "2025-06-03T09:02:17.730903+00:00"} {"global_step": 236406, "acc_step": 0, "speed/wps": 5523.817718835212, "speed/FLOPS": 244124469710379.94, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048167385160923004, "optim/lr": 9.205049120199593e-06, "optim/total_tokens": 1983117262848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2608331441879272, "created_at": "2025-06-03T09:02:20.703180+00:00"} {"global_step": 236407, "acc_step": 0, "speed/wps": 5530.809918599042, "speed/FLOPS": 244433489150618.47, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.48, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046351656317710876, "optim/lr": 9.201501895105046e-06, "optim/total_tokens": 1983125651456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2638416290283203, "created_at": "2025-06-03T09:02:23.670010+00:00"} {"global_step": 236408, "acc_step": 0, "speed/wps": 5519.552450189872, "speed/FLOPS": 243935966667879.9, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04694918170571327, "optim/lr": 9.1979546700105e-06, "optim/total_tokens": 1983134040064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2628153562545776, "created_at": "2025-06-03T09:02:26.647808+00:00"} {"global_step": 236409, "acc_step": 0, "speed/wps": 5511.166735885752, "speed/FLOPS": 243565361017614.62, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04754285514354706, "optim/lr": 9.194407444915953e-06, "optim/total_tokens": 1983142428672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2467291355133057, "created_at": "2025-06-03T09:02:29.627733+00:00"} {"global_step": 236410, "acc_step": 0, "speed/wps": 5470.35810421281, "speed/FLOPS": 241761828375182.7, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04791911691427231, "optim/lr": 9.190860219821629e-06, "optim/total_tokens": 1983150817280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2644399404525757, "created_at": "2025-06-03T09:02:32.632009+00:00"} {"global_step": 236411, "acc_step": 0, "speed/wps": 5536.745024062307, "speed/FLOPS": 244695790433471.1, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04641295224428177, "optim/lr": 9.187312994727083e-06, "optim/total_tokens": 1983159205888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2865368127822876, "created_at": "2025-06-03T09:02:35.596403+00:00"} {"global_step": 236412, "acc_step": 0, "speed/wps": 5520.686080625161, "speed/FLOPS": 243986067330673.12, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05159669741988182, "optim/lr": 9.183765769632534e-06, "optim/total_tokens": 1983167594496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2618732452392578, "created_at": "2025-06-03T09:02:38.568995+00:00"} {"global_step": 236413, "acc_step": 0, "speed/wps": 5493.614885635014, "speed/FLOPS": 242789659075045.62, "speed/curr_iter_time": 2.9801, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9801, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.14 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.14, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04754231125116348, "optim/lr": 9.180218544537988e-06, "optim/total_tokens": 1983175983104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2634456157684326, "created_at": "2025-06-03T09:02:41.556122+00:00"} {"global_step": 236414, "acc_step": 0, "speed/wps": 5518.358187196517, "speed/FLOPS": 243883186356365.78, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04738938808441162, "optim/lr": 9.176671319443664e-06, "optim/total_tokens": 1983184371712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2634658813476562, "created_at": "2025-06-03T09:02:44.533486+00:00"} {"global_step": 236415, "acc_step": 0, "speed/wps": 5511.930922490083, "speed/FLOPS": 243599134154064.4, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04697217792272568, "optim/lr": 9.173124094349117e-06, "optim/total_tokens": 1983192760320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2750591039657593, "created_at": "2025-06-03T09:02:47.510833+00:00"} {"global_step": 236416, "acc_step": 0, "speed/wps": 5525.538896302948, "speed/FLOPS": 244200536944668.97, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.054145053029060364, "optim/lr": 9.16957686925457e-06, "optim/total_tokens": 1983201148928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2495465278625488, "created_at": "2025-06-03T09:02:50.484691+00:00"} {"global_step": 236417, "acc_step": 0, "speed/wps": 5523.179094425599, "speed/FLOPS": 244096245780251.1, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04621816799044609, "optim/lr": 9.166029644160023e-06, "optim/total_tokens": 1983209537536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2517690658569336, "created_at": "2025-06-03T09:02:53.455718+00:00"} {"global_step": 236418, "acc_step": 0, "speed/wps": 5520.2479328798745, "speed/FLOPS": 243966703442974.94, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04687602445483208, "optim/lr": 9.162482419065698e-06, "optim/total_tokens": 1983217926144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2452021837234497, "created_at": "2025-06-03T09:02:56.428494+00:00"} {"global_step": 236419, "acc_step": 0, "speed/wps": 5509.545134847722, "speed/FLOPS": 243493694551840.22, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04909728839993477, "optim/lr": 9.158935193971152e-06, "optim/total_tokens": 1983226314752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2537548542022705, "created_at": "2025-06-03T09:02:59.406906+00:00"} {"global_step": 236420, "acc_step": 0, "speed/wps": 5514.951608608021, "speed/FLOPS": 243732633019204.12, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04689035937190056, "optim/lr": 9.155387968876605e-06, "optim/total_tokens": 1983234703360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2683641910552979, "created_at": "2025-06-03T09:03:02.385741+00:00"} {"global_step": 236421, "acc_step": 0, "speed/wps": 5509.969134718847, "speed/FLOPS": 243512433175915.88, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047113072127103806, "optim/lr": 9.151840743782059e-06, "optim/total_tokens": 1983243091968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.248416543006897, "created_at": "2025-06-03T09:03:05.366653+00:00"} {"global_step": 236422, "acc_step": 0, "speed/wps": 5532.599408331436, "speed/FLOPS": 244512575437351.53, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04682055860757828, "optim/lr": 9.148293518687733e-06, "optim/total_tokens": 1983251480576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2555826902389526, "created_at": "2025-06-03T09:03:08.336060+00:00"} {"global_step": 236423, "acc_step": 0, "speed/wps": 5530.64479881307, "speed/FLOPS": 244426191701238.2, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048811983317136765, "optim/lr": 9.144746293593186e-06, "optim/total_tokens": 1983259869184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2558581829071045, "created_at": "2025-06-03T09:03:11.306004+00:00"} {"global_step": 236424, "acc_step": 0, "speed/wps": 5524.001098417727, "speed/FLOPS": 244132574149305.3, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04625092074275017, "optim/lr": 9.14119906849864e-06, "optim/total_tokens": 1983268257792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2612178325653076, "created_at": "2025-06-03T09:03:14.276688+00:00"} {"global_step": 236425, "acc_step": 0, "speed/wps": 5520.910551893211, "speed/FLOPS": 243995987811772.84, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047647539526224136, "optim/lr": 9.137651843404094e-06, "optim/total_tokens": 1983276646400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2651526927947998, "created_at": "2025-06-03T09:03:17.253137+00:00"} {"global_step": 236426, "acc_step": 0, "speed/wps": 5524.685295393749, "speed/FLOPS": 244162812153607.88, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048060011118650436, "optim/lr": 9.13410461830977e-06, "optim/total_tokens": 1983285035008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2818334102630615, "created_at": "2025-06-03T09:03:20.223961+00:00"} {"global_step": 236427, "acc_step": 0, "speed/wps": 5508.0337240642275, "speed/FLOPS": 243426897931311.44, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.13 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.13, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04685039073228836, "optim/lr": 9.130557393215221e-06, "optim/total_tokens": 1983293423616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2522165775299072, "created_at": "2025-06-03T09:03:23.203078+00:00"} {"global_step": 236428, "acc_step": 0, "speed/wps": 5519.5032919980085, "speed/FLOPS": 243933794127414.0, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04641915112733841, "optim/lr": 9.127010168120675e-06, "optim/total_tokens": 1983301812224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.265778660774231, "created_at": "2025-06-03T09:03:26.180131+00:00"} {"global_step": 236429, "acc_step": 0, "speed/wps": 5518.217020325345, "speed/FLOPS": 243876947503217.53, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04766371101140976, "optim/lr": 9.12346294302635e-06, "optim/total_tokens": 1983310200832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2572346925735474, "created_at": "2025-06-03T09:03:29.156307+00:00"} {"global_step": 236430, "acc_step": 0, "speed/wps": 5510.097705420713, "speed/FLOPS": 243518115342853.84, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04716785252094269, "optim/lr": 9.119915717931804e-06, "optim/total_tokens": 1983318589440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2644864320755005, "created_at": "2025-06-03T09:03:32.134443+00:00"} {"global_step": 236431, "acc_step": 0, "speed/wps": 5527.596207372224, "speed/FLOPS": 244291459563658.3, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04721645638346672, "optim/lr": 9.116368492837257e-06, "optim/total_tokens": 1983326978048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.262091040611267, "created_at": "2025-06-03T09:03:35.103191+00:00"} {"global_step": 236432, "acc_step": 0, "speed/wps": 5526.3936702864185, "speed/FLOPS": 244238313579608.5, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047437701374292374, "optim/lr": 9.112821267742711e-06, "optim/total_tokens": 1983335366656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2456564903259277, "created_at": "2025-06-03T09:03:38.071955+00:00"} {"global_step": 236433, "acc_step": 0, "speed/wps": 5516.1206830923165, "speed/FLOPS": 243784300127544.3, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047341685742139816, "optim/lr": 9.109274042648385e-06, "optim/total_tokens": 1983343755264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.250117540359497, "created_at": "2025-06-03T09:03:41.046773+00:00"} {"global_step": 236434, "acc_step": 0, "speed/wps": 5524.528887180802, "speed/FLOPS": 244155899711165.44, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.72, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04744201898574829, "optim/lr": 9.105726817553839e-06, "optim/total_tokens": 1983352143872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2486757040023804, "created_at": "2025-06-03T09:03:44.022297+00:00"} {"global_step": 236435, "acc_step": 0, "speed/wps": 5513.498642532312, "speed/FLOPS": 243668419355612.34, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04688593000173569, "optim/lr": 9.102179592459292e-06, "optim/total_tokens": 1983360532480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2692844867706299, "created_at": "2025-06-03T09:03:46.999433+00:00"} {"global_step": 236436, "acc_step": 0, "speed/wps": 5518.705363834468, "speed/FLOPS": 243898529786752.1, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0467449352145195, "optim/lr": 9.098632367364746e-06, "optim/total_tokens": 1983368921088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2759267091751099, "created_at": "2025-06-03T09:03:49.976374+00:00"} {"global_step": 236437, "acc_step": 0, "speed/wps": 5505.312454051218, "speed/FLOPS": 243306631725459.03, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047220584005117416, "optim/lr": 9.095085142270421e-06, "optim/total_tokens": 1983377309696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2563862800598145, "created_at": "2025-06-03T09:03:52.960899+00:00"} {"global_step": 236438, "acc_step": 0, "speed/wps": 5499.1657697269675, "speed/FLOPS": 243034979739909.6, "speed/curr_iter_time": 2.9785, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9785, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.12 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.12, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04763359948992729, "optim/lr": 9.091537917175873e-06, "optim/total_tokens": 1983385698304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2728520631790161, "created_at": "2025-06-03T09:03:55.948598+00:00"} {"global_step": 236439, "acc_step": 0, "speed/wps": 5527.921317318257, "speed/FLOPS": 244305827759209.44, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0481179840862751, "optim/lr": 9.087990692081327e-06, "optim/total_tokens": 1983394086912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2666019201278687, "created_at": "2025-06-03T09:03:58.917005+00:00"} {"global_step": 236440, "acc_step": 0, "speed/wps": 5505.66841859093, "speed/FLOPS": 243322363536122.6, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04653945192694664, "optim/lr": 9.08444346698678e-06, "optim/total_tokens": 1983402475520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2678166627883911, "created_at": "2025-06-03T09:04:01.897164+00:00"} {"global_step": 236441, "acc_step": 0, "speed/wps": 5518.202441232338, "speed/FLOPS": 243876303181929.2, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04795515909790993, "optim/lr": 9.080896241892456e-06, "optim/total_tokens": 1983410864128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2567803859710693, "created_at": "2025-06-03T09:04:04.874189+00:00"} {"global_step": 236442, "acc_step": 0, "speed/wps": 5519.741833829559, "speed/FLOPS": 243944336455400.78, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04748248681426048, "optim/lr": 9.07734901679791e-06, "optim/total_tokens": 1983419252736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2712727785110474, "created_at": "2025-06-03T09:04:07.846730+00:00"} {"global_step": 236443, "acc_step": 0, "speed/wps": 5515.037899407768, "speed/FLOPS": 243736446630876.6, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04714393615722656, "optim/lr": 9.073801791703361e-06, "optim/total_tokens": 1983427641344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2654646635055542, "created_at": "2025-06-03T09:04:10.822309+00:00"} {"global_step": 236444, "acc_step": 0, "speed/wps": 5514.3888843598925, "speed/FLOPS": 243707763487720.66, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04776229336857796, "optim/lr": 9.070254566608815e-06, "optim/total_tokens": 1983436029952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.252131462097168, "created_at": "2025-06-03T09:04:13.798324+00:00"} {"global_step": 236445, "acc_step": 0, "speed/wps": 5505.232133557278, "speed/FLOPS": 243303081970744.44, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04813915863633156, "optim/lr": 9.06670734151449e-06, "optim/total_tokens": 1983444418560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2560625076293945, "created_at": "2025-06-03T09:04:16.779399+00:00"} {"global_step": 236446, "acc_step": 0, "speed/wps": 5513.147776248424, "speed/FLOPS": 243652912861760.9, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.11 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.11, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04730192944407463, "optim/lr": 9.063160116419944e-06, "optim/total_tokens": 1983452807168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2734975814819336, "created_at": "2025-06-03T09:04:19.755856+00:00"} {"global_step": 236447, "acc_step": 0, "speed/wps": 5516.005063376658, "speed/FLOPS": 243779190327907.56, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047026537358760834, "optim/lr": 9.059612891325398e-06, "optim/total_tokens": 1983461195776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2747424840927124, "created_at": "2025-06-03T09:04:22.734648+00:00"} {"global_step": 236448, "acc_step": 0, "speed/wps": 5525.528937910603, "speed/FLOPS": 244200096834699.03, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04647166654467583, "optim/lr": 9.05606566623085e-06, "optim/total_tokens": 1983469584384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2575695514678955, "created_at": "2025-06-03T09:04:25.704387+00:00"} {"global_step": 236449, "acc_step": 0, "speed/wps": 5513.964785156416, "speed/FLOPS": 243689020473663.5, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04795360937714577, "optim/lr": 9.052518441136525e-06, "optim/total_tokens": 1983477972992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2624685764312744, "created_at": "2025-06-03T09:04:28.685475+00:00"} {"global_step": 236450, "acc_step": 0, "speed/wps": 5521.549589768015, "speed/FLOPS": 244024230014946.8, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 194.72, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04711877182126045, "optim/lr": 9.048971216041979e-06, "optim/total_tokens": 1983486361600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2611172199249268, "created_at": "2025-06-03T09:04:31.661417+00:00"} {"global_step": 236451, "acc_step": 0, "speed/wps": 5522.096357491936, "speed/FLOPS": 244048394349733.22, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047801654785871506, "optim/lr": 9.045423990947432e-06, "optim/total_tokens": 1983494750208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2616344690322876, "created_at": "2025-06-03T09:04:34.636351+00:00"} {"global_step": 236452, "acc_step": 0, "speed/wps": 5509.276932603648, "speed/FLOPS": 243481841385435.66, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04675336182117462, "optim/lr": 9.041876765852886e-06, "optim/total_tokens": 1983503138816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2670828104019165, "created_at": "2025-06-03T09:04:37.615521+00:00"} {"global_step": 236453, "acc_step": 0, "speed/wps": 5514.639203459524, "speed/FLOPS": 243718826310675.06, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048002198338508606, "optim/lr": 9.038329540758562e-06, "optim/total_tokens": 1983511527424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.255987524986267, "created_at": "2025-06-03T09:04:40.594996+00:00"} {"global_step": 236454, "acc_step": 0, "speed/wps": 5510.155492958879, "speed/FLOPS": 243520669256257.34, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04693182185292244, "optim/lr": 9.034782315664013e-06, "optim/total_tokens": 1983519916032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.257505178451538, "created_at": "2025-06-03T09:04:43.573820+00:00"} {"global_step": 236455, "acc_step": 0, "speed/wps": 5505.408066692564, "speed/FLOPS": 243310857314816.66, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04750867933034897, "optim/lr": 9.031235090569467e-06, "optim/total_tokens": 1983528304640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2712469100952148, "created_at": "2025-06-03T09:04:46.554997+00:00"} {"global_step": 236456, "acc_step": 0, "speed/wps": 5518.139492941589, "speed/FLOPS": 243873521189676.66, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0474475659430027, "optim/lr": 9.027687865475143e-06, "optim/total_tokens": 1983536693248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2803188562393188, "created_at": "2025-06-03T09:04:49.528790+00:00"} {"global_step": 236457, "acc_step": 0, "speed/wps": 5515.924651088847, "speed/FLOPS": 243775636516373.72, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.1 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.1, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04790881276130676, "optim/lr": 9.024140640380596e-06, "optim/total_tokens": 1983545081856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2548528909683228, "created_at": "2025-06-03T09:04:52.503932+00:00"} {"global_step": 236458, "acc_step": 0, "speed/wps": 5523.669283085673, "speed/FLOPS": 244117909610013.34, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04854351282119751, "optim/lr": 9.02059341528605e-06, "optim/total_tokens": 1983553470464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.268254280090332, "created_at": "2025-06-03T09:04:55.474337+00:00"} {"global_step": 236459, "acc_step": 0, "speed/wps": 5520.878187301979, "speed/FLOPS": 243994557462497.38, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04663559049367905, "optim/lr": 9.017046190191502e-06, "optim/total_tokens": 1983561859072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2603501081466675, "created_at": "2025-06-03T09:04:58.449388+00:00"} {"global_step": 236460, "acc_step": 0, "speed/wps": 5513.7753207602655, "speed/FLOPS": 243680647117120.34, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04626715928316116, "optim/lr": 9.013498965097177e-06, "optim/total_tokens": 1983570247680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.283206820487976, "created_at": "2025-06-03T09:05:01.427618+00:00"} {"global_step": 236461, "acc_step": 0, "speed/wps": 5522.477037714096, "speed/FLOPS": 244065218467054.66, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04975493252277374, "optim/lr": 9.009951740002631e-06, "optim/total_tokens": 1983578636288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2809723615646362, "created_at": "2025-06-03T09:05:04.399970+00:00"} {"global_step": 236462, "acc_step": 0, "speed/wps": 5516.764984602443, "speed/FLOPS": 243812774956457.84, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0463930107653141, "optim/lr": 9.006404514908084e-06, "optim/total_tokens": 1983587024896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2677966356277466, "created_at": "2025-06-03T09:05:07.377948+00:00"} {"global_step": 236463, "acc_step": 0, "speed/wps": 5521.257675911215, "speed/FLOPS": 244011328916626.84, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047260694205760956, "optim/lr": 9.002857289813538e-06, "optim/total_tokens": 1983595413504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2731637954711914, "created_at": "2025-06-03T09:05:10.349762+00:00"} {"global_step": 236464, "acc_step": 0, "speed/wps": 5513.746355598001, "speed/FLOPS": 243679367005205.4, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046755023300647736, "optim/lr": 8.999310064719214e-06, "optim/total_tokens": 1983603802112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2631908655166626, "created_at": "2025-06-03T09:05:13.325923+00:00"} {"global_step": 236465, "acc_step": 0, "speed/wps": 5518.663468402137, "speed/FLOPS": 243896678223083.34, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047619812190532684, "optim/lr": 8.995762839624666e-06, "optim/total_tokens": 1983612190720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2478504180908203, "created_at": "2025-06-03T09:05:16.299800+00:00"} {"global_step": 236466, "acc_step": 0, "speed/wps": 5519.579347597697, "speed/FLOPS": 243937155395632.38, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04606999456882477, "optim/lr": 8.992215614530119e-06, "optim/total_tokens": 1983620579328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.260025978088379, "created_at": "2025-06-03T09:05:19.275299+00:00"} {"global_step": 236467, "acc_step": 0, "speed/wps": 5523.3630030110735, "speed/FLOPS": 244104373598399.6, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04675943776965141, "optim/lr": 8.988668389435573e-06, "optim/total_tokens": 1983628967936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2648146152496338, "created_at": "2025-06-03T09:05:22.246370+00:00"} {"global_step": 236468, "acc_step": 0, "speed/wps": 5526.720493982378, "speed/FLOPS": 244252757514134.6, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047097399830818176, "optim/lr": 8.985121164341248e-06, "optim/total_tokens": 1983637356544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2674616575241089, "created_at": "2025-06-03T09:05:25.215546+00:00"} {"global_step": 236469, "acc_step": 0, "speed/wps": 5515.672965841556, "speed/FLOPS": 243764513316685.34, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.051163915544748306, "optim/lr": 8.981573939246702e-06, "optim/total_tokens": 1983645745152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2711788415908813, "created_at": "2025-06-03T09:05:28.190282+00:00"} {"global_step": 236470, "acc_step": 0, "speed/wps": 5508.324584022939, "speed/FLOPS": 243439752452730.28, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048396769911050797, "optim/lr": 8.978026714152154e-06, "optim/total_tokens": 1983654133760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.259751319885254, "created_at": "2025-06-03T09:05:31.168853+00:00"} {"global_step": 236471, "acc_step": 0, "speed/wps": 5509.643599795232, "speed/FLOPS": 243498046198530.88, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04778073728084564, "optim/lr": 8.974479489057607e-06, "optim/total_tokens": 1983662522368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2692238092422485, "created_at": "2025-06-03T09:05:34.147001+00:00"} {"global_step": 236472, "acc_step": 0, "speed/wps": 5513.804520391971, "speed/FLOPS": 243681937591384.47, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.09 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.09, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04676445201039314, "optim/lr": 8.970932263963283e-06, "optim/total_tokens": 1983670910976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2701377868652344, "created_at": "2025-06-03T09:05:37.123683+00:00"} {"global_step": 236473, "acc_step": 0, "speed/wps": 5528.927227996367, "speed/FLOPS": 244350283862464.3, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 194.6, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04747824743390083, "optim/lr": 8.967385038868737e-06, "optim/total_tokens": 1983679299584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2718256711959839, "created_at": "2025-06-03T09:05:40.091303+00:00"} {"global_step": 236474, "acc_step": 0, "speed/wps": 5518.712661841463, "speed/FLOPS": 243898852321306.7, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04703967645764351, "optim/lr": 8.96383781377419e-06, "optim/total_tokens": 1983687688192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2679803371429443, "created_at": "2025-06-03T09:05:43.065478+00:00"} {"global_step": 236475, "acc_step": 0, "speed/wps": 5513.323954344886, "speed/FLOPS": 243660699031863.3, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048028379678726196, "optim/lr": 8.960290588679642e-06, "optim/total_tokens": 1983696076800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.267944574356079, "created_at": "2025-06-03T09:05:46.041752+00:00"} {"global_step": 236476, "acc_step": 0, "speed/wps": 5524.741103861543, "speed/FLOPS": 244165278602230.75, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046237993985414505, "optim/lr": 8.956743363585318e-06, "optim/total_tokens": 1983704465408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.269948124885559, "created_at": "2025-06-03T09:05:49.012151+00:00"} {"global_step": 236477, "acc_step": 0, "speed/wps": 5511.131511568757, "speed/FLOPS": 243563804283097.8, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046967219561338425, "optim/lr": 8.953196138490771e-06, "optim/total_tokens": 1983712854016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2632282972335815, "created_at": "2025-06-03T09:05:51.989531+00:00"} {"global_step": 236478, "acc_step": 0, "speed/wps": 5510.724723168854, "speed/FLOPS": 243545826317953.9, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047306593507528305, "optim/lr": 8.949648913396225e-06, "optim/total_tokens": 1983721242624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2812559604644775, "created_at": "2025-06-03T09:05:54.967436+00:00"} {"global_step": 236479, "acc_step": 0, "speed/wps": 5510.7544105300485, "speed/FLOPS": 243547138347365.0, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047248151153326035, "optim/lr": 8.946101688301678e-06, "optim/total_tokens": 1983729631232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2483241558074951, "created_at": "2025-06-03T09:05:57.945206+00:00"} {"global_step": 236480, "acc_step": 0, "speed/wps": 5512.13316334733, "speed/FLOPS": 243608072164792.2, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04651961475610733, "optim/lr": 8.942554463207352e-06, "optim/total_tokens": 1983738019840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.283720850944519, "created_at": "2025-06-03T09:06:00.921565+00:00"} {"global_step": 236481, "acc_step": 0, "speed/wps": 5518.135879743763, "speed/FLOPS": 243873361504826.75, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047301486134529114, "optim/lr": 8.939007238112806e-06, "optim/total_tokens": 1983746408448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2619844675064087, "created_at": "2025-06-03T09:06:03.901248+00:00"} {"global_step": 236482, "acc_step": 0, "speed/wps": 5521.651443063125, "speed/FLOPS": 244028731409258.25, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04628446325659752, "optim/lr": 8.93546001301826e-06, "optim/total_tokens": 1983754797056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2726203203201294, "created_at": "2025-06-03T09:06:06.873555+00:00"} {"global_step": 236483, "acc_step": 0, "speed/wps": 5518.338950099565, "speed/FLOPS": 243882336175144.9, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04701783508062363, "optim/lr": 8.931912787923935e-06, "optim/total_tokens": 1983763185664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2579642534255981, "created_at": "2025-06-03T09:06:09.849111+00:00"} {"global_step": 236484, "acc_step": 0, "speed/wps": 5518.323447311839, "speed/FLOPS": 243881651031277.88, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04901948571205139, "optim/lr": 8.928365562829389e-06, "optim/total_tokens": 1983771574272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2734706401824951, "created_at": "2025-06-03T09:06:12.827267+00:00"} {"global_step": 236485, "acc_step": 0, "speed/wps": 5523.265060230699, "speed/FLOPS": 244100045028823.66, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 194.8, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04639666527509689, "optim/lr": 8.92481833773484e-06, "optim/total_tokens": 1983779962880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.272487998008728, "created_at": "2025-06-03T09:06:15.798173+00:00"} {"global_step": 236486, "acc_step": 0, "speed/wps": 5517.792146067991, "speed/FLOPS": 243858170235746.06, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047828253358602524, "optim/lr": 8.921271112640294e-06, "optim/total_tokens": 1983788351488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2512738704681396, "created_at": "2025-06-03T09:06:18.773433+00:00"} {"global_step": 236487, "acc_step": 0, "speed/wps": 5499.692858412225, "speed/FLOPS": 243058274361913.5, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04720481112599373, "optim/lr": 8.91772388754597e-06, "optim/total_tokens": 1983796740096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2628202438354492, "created_at": "2025-06-03T09:06:21.759058+00:00"} {"global_step": 236488, "acc_step": 0, "speed/wps": 5506.5634341957975, "speed/FLOPS": 243361918644752.6, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.08 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.08, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048247452825307846, "optim/lr": 8.914176662451423e-06, "optim/total_tokens": 1983805128704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2693318128585815, "created_at": "2025-06-03T09:06:24.742147+00:00"} {"global_step": 236489, "acc_step": 0, "speed/wps": 5511.298997808233, "speed/FLOPS": 243571206317610.4, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04845681041479111, "optim/lr": 8.910629437356877e-06, "optim/total_tokens": 1983813517312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2730646133422852, "created_at": "2025-06-03T09:06:27.719617+00:00"} {"global_step": 236490, "acc_step": 0, "speed/wps": 5513.624863701174, "speed/FLOPS": 243673997685217.53, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04678365960717201, "optim/lr": 8.90708221226233e-06, "optim/total_tokens": 1983821905920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.283576250076294, "created_at": "2025-06-03T09:06:30.698936+00:00"} {"global_step": 236491, "acc_step": 0, "speed/wps": 5525.568772129242, "speed/FLOPS": 244201857303272.8, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04703225940465927, "optim/lr": 8.903534987168004e-06, "optim/total_tokens": 1983830294528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2638970613479614, "created_at": "2025-06-03T09:06:33.671775+00:00"} {"global_step": 236492, "acc_step": 0, "speed/wps": 5517.4123640767975, "speed/FLOPS": 243841385815635.78, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.048177991062402725, "optim/lr": 8.899987762073458e-06, "optim/total_tokens": 1983838683136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2742998600006104, "created_at": "2025-06-03T09:06:36.646282+00:00"} {"global_step": 236493, "acc_step": 0, "speed/wps": 5524.03505121055, "speed/FLOPS": 244134074688961.94, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04718095064163208, "optim/lr": 8.896440536978911e-06, "optim/total_tokens": 1983847071744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2615119218826294, "created_at": "2025-06-03T09:06:39.616528+00:00"} {"global_step": 236494, "acc_step": 0, "speed/wps": 5520.083748410411, "speed/FLOPS": 243959447329796.97, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04743895307183266, "optim/lr": 8.892893311884365e-06, "optim/total_tokens": 1983855460352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.26227867603302, "created_at": "2025-06-03T09:06:42.592038+00:00"} {"global_step": 236495, "acc_step": 0, "speed/wps": 5529.105156768541, "speed/FLOPS": 244358147403472.38, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04890378192067146, "optim/lr": 8.88934608679004e-06, "optim/total_tokens": 1983863848960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2724542617797852, "created_at": "2025-06-03T09:06:45.564393+00:00"} {"global_step": 236496, "acc_step": 0, "speed/wps": 5513.13724437149, "speed/FLOPS": 243652447406707.47, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.07 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.07, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04794635251164436, "optim/lr": 8.885798861695493e-06, "optim/total_tokens": 1983872237568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2716847658157349, "created_at": "2025-06-03T09:06:48.544440+00:00"} {"global_step": 236497, "acc_step": 0, "speed/wps": 5516.2187337236555, "speed/FLOPS": 243788633463580.88, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04776112362742424, "optim/lr": 8.882251636600946e-06, "optim/total_tokens": 1983880626176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2789844274520874, "created_at": "2025-06-03T09:06:51.519149+00:00"} {"global_step": 236498, "acc_step": 0, "speed/wps": 5527.258561785252, "speed/FLOPS": 244276537356940.94, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.049360912293195724, "optim/lr": 8.8787044115064e-06, "optim/total_tokens": 1983889014784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2579628229141235, "created_at": "2025-06-03T09:06:54.491659+00:00"} {"global_step": 236499, "acc_step": 0, "speed/wps": 5524.728649928447, "speed/FLOPS": 244164728202132.94, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04710351675748825, "optim/lr": 8.875157186412075e-06, "optim/total_tokens": 1983897403392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2719626426696777, "created_at": "2025-06-03T09:06:57.462098+00:00"} {"global_step": 236500, "acc_step": 0, "speed/wps": 5517.563330757811, "speed/FLOPS": 243848057770219.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04961981624364853, "optim/lr": 8.871609961317529e-06, "optim/total_tokens": 1983905792000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2601404190063477, "created_at": "2025-06-03T09:07:00.439767+00:00"} {"global_step": 236501, "acc_step": 0, "speed/wps": 5527.422548996254, "speed/FLOPS": 244283784752304.6, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047367699444293976, "optim/lr": 8.86806273622298e-06, "optim/total_tokens": 1983914180608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.277219533920288, "created_at": "2025-06-03T09:07:03.408695+00:00"} {"global_step": 236502, "acc_step": 0, "speed/wps": 5527.257146890906, "speed/FLOPS": 244276474825852.97, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046634968370199203, "optim/lr": 8.864515511128434e-06, "optim/total_tokens": 1983922569216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2595356702804565, "created_at": "2025-06-03T09:07:06.383267+00:00"} {"global_step": 236503, "acc_step": 0, "speed/wps": 5513.603459375995, "speed/FLOPS": 243673051723601.88, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04687320068478584, "optim/lr": 8.86096828603411e-06, "optim/total_tokens": 1983930957824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2525393962860107, "created_at": "2025-06-03T09:07:09.359465+00:00"} {"global_step": 236504, "acc_step": 0, "speed/wps": 5514.425399201799, "speed/FLOPS": 243709377256833.03, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.046549197286367416, "optim/lr": 8.857421060939564e-06, "optim/total_tokens": 1983939346432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.284078598022461, "created_at": "2025-06-03T09:07:12.339404+00:00"} {"global_step": 236505, "acc_step": 0, "speed/wps": 5509.386679741568, "speed/FLOPS": 243486691647194.94, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.06 hours", "speed/est_time_elapsed_hrs": 195.31, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.06, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047298409044742584, "optim/lr": 8.853873835845017e-06, "optim/total_tokens": 1983947735040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2587709426879883, "created_at": "2025-06-03T09:07:15.321005+00:00"} {"global_step": 236506, "acc_step": 0, "speed/wps": 5528.661444406445, "speed/FLOPS": 244338537588193.5, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04850836098194122, "optim/lr": 8.850326610750469e-06, "optim/total_tokens": 1983956123648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2513123750686646, "created_at": "2025-06-03T09:07:18.294143+00:00"} {"global_step": 236507, "acc_step": 0, "speed/wps": 5519.354297969646, "speed/FLOPS": 243927209353980.94, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.0493302159011364, "optim/lr": 8.846779385656145e-06, "optim/total_tokens": 1983964512256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.247839331626892, "created_at": "2025-06-03T09:07:21.273234+00:00"} {"global_step": 236508, "acc_step": 0, "speed/wps": 5526.56657085361, "speed/FLOPS": 244245954899693.03, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.05069872364401817, "optim/lr": 8.843232160561598e-06, "optim/total_tokens": 1983972900864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.273031234741211, "created_at": "2025-06-03T09:07:24.242751+00:00"} {"global_step": 236509, "acc_step": 0, "speed/wps": 5519.386280615726, "speed/FLOPS": 243928622823235.66, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04711040481925011, "optim/lr": 8.839684935467052e-06, "optim/total_tokens": 1983981289472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.262436032295227, "created_at": "2025-06-03T09:07:27.216220+00:00"} {"global_step": 236510, "acc_step": 0, "speed/wps": 5526.69464550673, "speed/FLOPS": 244251615143815.44, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04905916005373001, "optim/lr": 8.836137710372727e-06, "optim/total_tokens": 1983989678080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2595840692520142, "created_at": "2025-06-03T09:07:30.185804+00:00"} {"global_step": 236511, "acc_step": 0, "speed/wps": 5518.585856197652, "speed/FLOPS": 243893248160900.38, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04670431464910507, "optim/lr": 8.832590485278181e-06, "optim/total_tokens": 1983998066688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2582569122314453, "created_at": "2025-06-03T09:07:33.159444+00:00"} {"global_step": 236512, "acc_step": 0, "speed/wps": 5512.196444461446, "speed/FLOPS": 243610868866134.0, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.051559168845415115, "optim/lr": 8.829043260183633e-06, "optim/total_tokens": 1984006455296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2523046731948853, "created_at": "2025-06-03T09:07:36.141091+00:00"} {"global_step": 236513, "acc_step": 0, "speed/wps": 5525.1394780331875, "speed/FLOPS": 244182884701553.6, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04794025421142578, "optim/lr": 8.825496035089086e-06, "optim/total_tokens": 1984014843904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2642560005187988, "created_at": "2025-06-03T09:07:39.112941+00:00"} {"global_step": 236514, "acc_step": 0, "speed/wps": 5526.393681570785, "speed/FLOPS": 244238314078319.75, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04781058430671692, "optim/lr": 8.821948809994762e-06, "optim/total_tokens": 1984023232512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.259758710861206, "created_at": "2025-06-03T09:07:42.082216+00:00"} {"global_step": 236515, "acc_step": 0, "speed/wps": 5535.291641660467, "speed/FLOPS": 244631558370395.28, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04698776453733444, "optim/lr": 8.818401584900216e-06, "optim/total_tokens": 1984031621120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.282594919204712, "created_at": "2025-06-03T09:07:45.046561+00:00"} {"global_step": 236516, "acc_step": 0, "speed/wps": 5527.336224488945, "speed/FLOPS": 244279969650930.44, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047293130308389664, "optim/lr": 8.81485435980567e-06, "optim/total_tokens": 1984040009728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.268897294998169, "created_at": "2025-06-03T09:07:48.018775+00:00"} {"global_step": 236517, "acc_step": 0, "speed/wps": 5523.337662819395, "speed/FLOPS": 244103253691630.25, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04614945873618126, "optim/lr": 8.811307134711121e-06, "optim/total_tokens": 1984048398336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2569888830184937, "created_at": "2025-06-03T09:07:50.991101+00:00"} {"global_step": 236518, "acc_step": 0, "speed/wps": 5526.080102043506, "speed/FLOPS": 244224455468259.53, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04690587520599365, "optim/lr": 8.807759909616797e-06, "optim/total_tokens": 1984056786944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.274297833442688, "created_at": "2025-06-03T09:07:53.964398+00:00"} {"global_step": 236519, "acc_step": 0, "speed/wps": 5518.669037688032, "speed/FLOPS": 243896924357013.72, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.05 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.05, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04892820119857788, "optim/lr": 8.80421268452225e-06, "optim/total_tokens": 1984065175552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2621641159057617, "created_at": "2025-06-03T09:07:56.940884+00:00"} {"global_step": 236520, "acc_step": 0, "speed/wps": 5519.875390964232, "speed/FLOPS": 243950238997145.9, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.047371163964271545, "optim/lr": 8.800665459427704e-06, "optim/total_tokens": 1984073564160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2751893997192383, "created_at": "2025-06-03T09:07:59.918180+00:00"} {"global_step": 236521, "acc_step": 0, "speed/wps": 5520.335680461291, "speed/FLOPS": 243970581436940.72, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04667651653289795, "optim/lr": 8.797118234333157e-06, "optim/total_tokens": 1984081952768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2795313596725464, "created_at": "2025-06-03T09:08:02.890271+00:00"} {"global_step": 236522, "acc_step": 0, "speed/wps": 5516.1410895165145, "speed/FLOPS": 243785201987044.34, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.09, "optim/grad_norm": 0.04733525589108467, "optim/lr": 8.793571009238833e-06, "optim/total_tokens": 1984090341376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2726726531982422, "created_at": "2025-06-03T09:08:05.864903+00:00"} {"global_step": 236523, "acc_step": 0, "speed/wps": 5536.273623422059, "speed/FLOPS": 244674956938019.38, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04661053791642189, "optim/lr": 8.790023784144285e-06, "optim/total_tokens": 1984098729984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2649922370910645, "created_at": "2025-06-03T09:08:08.829299+00:00"} {"global_step": 236524, "acc_step": 0, "speed/wps": 5524.095711259651, "speed/FLOPS": 244136755552645.94, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04634685441851616, "optim/lr": 8.786476559049738e-06, "optim/total_tokens": 1984107118592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2657651901245117, "created_at": "2025-06-03T09:08:11.800480+00:00"} {"global_step": 236525, "acc_step": 0, "speed/wps": 5531.394172699175, "speed/FLOPS": 244459310191360.78, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047499675303697586, "optim/lr": 8.782929333955192e-06, "optim/total_tokens": 1984115507200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2791802883148193, "created_at": "2025-06-03T09:08:14.766646+00:00"} {"global_step": 236526, "acc_step": 0, "speed/wps": 5527.39315285142, "speed/FLOPS": 244282485593166.06, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04661884158849716, "optim/lr": 8.779382108860868e-06, "optim/total_tokens": 1984123895808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2560840845108032, "created_at": "2025-06-03T09:08:17.737437+00:00"} {"global_step": 236527, "acc_step": 0, "speed/wps": 5514.087815559664, "speed/FLOPS": 243694457787760.34, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046800222247838974, "optim/lr": 8.775834883766321e-06, "optim/total_tokens": 1984132284416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2792081832885742, "created_at": "2025-06-03T09:08:20.716979+00:00"} {"global_step": 236528, "acc_step": 0, "speed/wps": 5536.782202829086, "speed/FLOPS": 244697433544664.56, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04679564759135246, "optim/lr": 8.772287658671773e-06, "optim/total_tokens": 1984140673024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2628068923950195, "created_at": "2025-06-03T09:08:23.680218+00:00"} {"global_step": 236529, "acc_step": 0, "speed/wps": 5522.890189874084, "speed/FLOPS": 244083477677821.7, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04687432572245598, "optim/lr": 8.768740433577227e-06, "optim/total_tokens": 1984149061632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2748496532440186, "created_at": "2025-06-03T09:08:26.651270+00:00"} {"global_step": 236530, "acc_step": 0, "speed/wps": 5511.3698327597795, "speed/FLOPS": 243574336859902.6, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 195.26, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04641563445329666, "optim/lr": 8.765193208482902e-06, "optim/total_tokens": 1984157450240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.255149006843567, "created_at": "2025-06-03T09:08:29.629904+00:00"} {"global_step": 236531, "acc_step": 0, "speed/wps": 5517.106723396017, "speed/FLOPS": 243827878061956.06, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046977389603853226, "optim/lr": 8.761645983388356e-06, "optim/total_tokens": 1984165838848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.266986608505249, "created_at": "2025-06-03T09:08:32.604465+00:00"} {"global_step": 236532, "acc_step": 0, "speed/wps": 5512.117943678496, "speed/FLOPS": 243607399533331.06, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.04 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.04, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04748391732573509, "optim/lr": 8.75809875829381e-06, "optim/total_tokens": 1984174227456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2608323097229004, "created_at": "2025-06-03T09:08:35.581464+00:00"} {"global_step": 236533, "acc_step": 0, "speed/wps": 5522.921954297363, "speed/FLOPS": 244084881502745.56, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04650900512933731, "optim/lr": 8.754551533199261e-06, "optim/total_tokens": 1984182616064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2650806903839111, "created_at": "2025-06-03T09:08:38.552621+00:00"} {"global_step": 236534, "acc_step": 0, "speed/wps": 5519.847401276827, "speed/FLOPS": 243949001996226.84, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047723907977342606, "optim/lr": 8.751004308104937e-06, "optim/total_tokens": 1984191004672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.263418197631836, "created_at": "2025-06-03T09:08:41.525038+00:00"} {"global_step": 236535, "acc_step": 0, "speed/wps": 5512.369349493732, "speed/FLOPS": 243618510383552.88, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048951052129268646, "optim/lr": 8.74745708301039e-06, "optim/total_tokens": 1984199393280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2726272344589233, "created_at": "2025-06-03T09:08:44.501167+00:00"} {"global_step": 236536, "acc_step": 0, "speed/wps": 5511.331309753882, "speed/FLOPS": 243572634340220.53, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04774266481399536, "optim/lr": 8.743909857915844e-06, "optim/total_tokens": 1984207781888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.26883864402771, "created_at": "2025-06-03T09:08:47.478282+00:00"} {"global_step": 236537, "acc_step": 0, "speed/wps": 5514.411655573738, "speed/FLOPS": 243708769858819.0, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04726358503103256, "optim/lr": 8.74036263282152e-06, "optim/total_tokens": 1984216170496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2529137134552002, "created_at": "2025-06-03T09:08:50.454764+00:00"} {"global_step": 236538, "acc_step": 0, "speed/wps": 5507.768340862579, "speed/FLOPS": 243415169352152.94, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048409223556518555, "optim/lr": 8.736815407726972e-06, "optim/total_tokens": 1984224559104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2619668245315552, "created_at": "2025-06-03T09:08:53.434320+00:00"} {"global_step": 236539, "acc_step": 0, "speed/wps": 5512.09137152729, "speed/FLOPS": 243606225180256.34, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0489719919860363, "optim/lr": 8.733268182632425e-06, "optim/total_tokens": 1984232947712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.254802942276001, "created_at": "2025-06-03T09:08:56.411950+00:00"} {"global_step": 236540, "acc_step": 0, "speed/wps": 5538.732034746764, "speed/FLOPS": 244783606135281.47, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04820239543914795, "optim/lr": 8.729720957537879e-06, "optim/total_tokens": 1984241336320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2568594217300415, "created_at": "2025-06-03T09:08:59.376175+00:00"} {"global_step": 236541, "acc_step": 0, "speed/wps": 5521.034956322375, "speed/FLOPS": 244001485850782.3, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04718143492937088, "optim/lr": 8.726173732443554e-06, "optim/total_tokens": 1984249724928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2484157085418701, "created_at": "2025-06-03T09:09:02.351644+00:00"} {"global_step": 236542, "acc_step": 0, "speed/wps": 5536.856708242025, "speed/FLOPS": 244700726302563.22, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04696549475193024, "optim/lr": 8.722626507349008e-06, "optim/total_tokens": 1984258113536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2617921829223633, "created_at": "2025-06-03T09:09:05.315358+00:00"} {"global_step": 236543, "acc_step": 0, "speed/wps": 5520.4547688850025, "speed/FLOPS": 243975844535718.94, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04704667255282402, "optim/lr": 8.719079282254462e-06, "optim/total_tokens": 1984266502144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2362890243530273, "created_at": "2025-06-03T09:09:08.287571+00:00"} {"global_step": 236544, "acc_step": 0, "speed/wps": 5529.885323574534, "speed/FLOPS": 244392626783041.53, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04793005809187889, "optim/lr": 8.715532057159913e-06, "optim/total_tokens": 1984274890752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2728432416915894, "created_at": "2025-06-03T09:09:11.257019+00:00"} {"global_step": 236545, "acc_step": 0, "speed/wps": 5529.8516516885065, "speed/FLOPS": 244391138658027.47, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0467328280210495, "optim/lr": 8.711984832065589e-06, "optim/total_tokens": 1984283279360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2594819068908691, "created_at": "2025-06-03T09:09:14.226417+00:00"} {"global_step": 236546, "acc_step": 0, "speed/wps": 5518.114395810478, "speed/FLOPS": 243872412024940.28, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04877427965402603, "optim/lr": 8.708437606971043e-06, "optim/total_tokens": 1984291667968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2608814239501953, "created_at": "2025-06-03T09:09:17.200925+00:00"} {"global_step": 236547, "acc_step": 0, "speed/wps": 5502.254310354706, "speed/FLOPS": 243171477427071.6, "speed/curr_iter_time": 2.9768, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9768, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "2.03 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 2.03, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04676925390958786, "optim/lr": 8.704890381876496e-06, "optim/total_tokens": 1984300056576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2719217538833618, "created_at": "2025-06-03T09:09:20.187075+00:00"} {"global_step": 236548, "acc_step": 0, "speed/wps": 5518.980975028776, "speed/FLOPS": 243910710390834.53, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04778289049863815, "optim/lr": 8.70134315678195e-06, "optim/total_tokens": 1984308445184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2663159370422363, "created_at": "2025-06-03T09:09:23.160898+00:00"} {"global_step": 236549, "acc_step": 0, "speed/wps": 5518.71370664134, "speed/FLOPS": 243898898496113.47, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047458112239837646, "optim/lr": 8.697795931687624e-06, "optim/total_tokens": 1984316833792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2513900995254517, "created_at": "2025-06-03T09:09:26.134403+00:00"} {"global_step": 236550, "acc_step": 0, "speed/wps": 5528.279791683095, "speed/FLOPS": 244321670491297.16, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04637472704052925, "optim/lr": 8.694248706593077e-06, "optim/total_tokens": 1984325222400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2482572793960571, "created_at": "2025-06-03T09:09:29.102548+00:00"} {"global_step": 236551, "acc_step": 0, "speed/wps": 5519.509273832893, "speed/FLOPS": 243934058493898.1, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.02 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.02, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04723067954182625, "optim/lr": 8.69070148149853e-06, "optim/total_tokens": 1984333611008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2613117694854736, "created_at": "2025-06-03T09:09:32.075832+00:00"} {"global_step": 236552, "acc_step": 0, "speed/wps": 5530.873585801006, "speed/FLOPS": 244436302915067.0, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04874265193939209, "optim/lr": 8.687154256403984e-06, "optim/total_tokens": 1984341999616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.25826895236969, "created_at": "2025-06-03T09:09:35.042803+00:00"} {"global_step": 236553, "acc_step": 0, "speed/wps": 5532.079061213614, "speed/FLOPS": 244489578758121.78, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04652557894587517, "optim/lr": 8.68360703130966e-06, "optim/total_tokens": 1984350388224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.25630521774292, "created_at": "2025-06-03T09:09:38.008850+00:00"} {"global_step": 236554, "acc_step": 0, "speed/wps": 5520.715622900695, "speed/FLOPS": 243987372948040.66, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0496787391602993, "optim/lr": 8.680059806215112e-06, "optim/total_tokens": 1984358776832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.266335129737854, "created_at": "2025-06-03T09:09:40.980886+00:00"} {"global_step": 236555, "acc_step": 0, "speed/wps": 5521.447297894895, "speed/FLOPS": 244019709237732.2, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04833480715751648, "optim/lr": 8.676512581120565e-06, "optim/total_tokens": 1984367165440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2700834274291992, "created_at": "2025-06-03T09:09:43.953837+00:00"} {"global_step": 236556, "acc_step": 0, "speed/wps": 5522.905942000112, "speed/FLOPS": 244084173841165.44, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04709123447537422, "optim/lr": 8.672965356026019e-06, "optim/total_tokens": 1984375554048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2691882848739624, "created_at": "2025-06-03T09:09:46.926031+00:00"} {"global_step": 236557, "acc_step": 0, "speed/wps": 5529.953221354071, "speed/FLOPS": 244395627517364.75, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05152837187051773, "optim/lr": 8.669418130931695e-06, "optim/total_tokens": 1984383942656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2560063600540161, "created_at": "2025-06-03T09:09:49.898096+00:00"} {"global_step": 236558, "acc_step": 0, "speed/wps": 5532.5246825156, "speed/FLOPS": 244509272938772.97, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.44, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047731444239616394, "optim/lr": 8.665870905837148e-06, "optim/total_tokens": 1984392331264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2709054946899414, "created_at": "2025-06-03T09:09:52.866136+00:00"} {"global_step": 236559, "acc_step": 0, "speed/wps": 5524.211141754608, "speed/FLOPS": 244141856989696.22, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05184345692396164, "optim/lr": 8.6623236807426e-06, "optim/total_tokens": 1984400719872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2540384531021118, "created_at": "2025-06-03T09:09:55.840511+00:00"} {"global_step": 236560, "acc_step": 0, "speed/wps": 5525.594479474002, "speed/FLOPS": 244202993436329.1, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05146591365337372, "optim/lr": 8.658776455648054e-06, "optim/total_tokens": 1984409108480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2500264644622803, "created_at": "2025-06-03T09:09:58.812065+00:00"} {"global_step": 236561, "acc_step": 0, "speed/wps": 5522.42066086377, "speed/FLOPS": 244062726898833.12, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.8, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05813673511147499, "optim/lr": 8.65522923055373e-06, "optim/total_tokens": 1984417497088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.274451494216919, "created_at": "2025-06-03T09:10:01.787476+00:00"} {"global_step": 236562, "acc_step": 0, "speed/wps": 5514.938574649944, "speed/FLOPS": 243732056984970.97, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05009781941771507, "optim/lr": 8.651682005459183e-06, "optim/total_tokens": 1984425885696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2631529569625854, "created_at": "2025-06-03T09:10:04.763188+00:00"} {"global_step": 236563, "acc_step": 0, "speed/wps": 5529.567919378434, "speed/FLOPS": 244378599142195.9, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04636217653751373, "optim/lr": 8.648134780364636e-06, "optim/total_tokens": 1984434274304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2646057605743408, "created_at": "2025-06-03T09:10:07.733258+00:00"} {"global_step": 236564, "acc_step": 0, "speed/wps": 5514.435813273729, "speed/FLOPS": 243709837505508.25, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048055849969387054, "optim/lr": 8.644587555270312e-06, "optim/total_tokens": 1984442662912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2626171112060547, "created_at": "2025-06-03T09:10:10.708779+00:00"} {"global_step": 236565, "acc_step": 0, "speed/wps": 5525.041077481167, "speed/FLOPS": 244178535900813.97, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04685356095433235, "optim/lr": 8.641040330175764e-06, "optim/total_tokens": 1984451051520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2619097232818604, "created_at": "2025-06-03T09:10:13.678748+00:00"} {"global_step": 236566, "acc_step": 0, "speed/wps": 5523.7537057935215, "speed/FLOPS": 244121640661585.7, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04712052270770073, "optim/lr": 8.637493105081218e-06, "optim/total_tokens": 1984459440128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.270803689956665, "created_at": "2025-06-03T09:10:16.649263+00:00"} {"global_step": 236567, "acc_step": 0, "speed/wps": 5525.551974340309, "speed/FLOPS": 244201114926980.88, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04702511057257652, "optim/lr": 8.633945879986671e-06, "optim/total_tokens": 1984467828736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.258301019668579, "created_at": "2025-06-03T09:10:19.623212+00:00"} {"global_step": 236568, "acc_step": 0, "speed/wps": 5520.969928752159, "speed/FLOPS": 243998611965020.03, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04671585187315941, "optim/lr": 8.630398654892347e-06, "optim/total_tokens": 1984476217344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2601572275161743, "created_at": "2025-06-03T09:10:22.596456+00:00"} {"global_step": 236569, "acc_step": 0, "speed/wps": 5528.349591891753, "speed/FLOPS": 244324755303250.0, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.050200533121824265, "optim/lr": 8.6268514297978e-06, "optim/total_tokens": 1984484605952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2592424154281616, "created_at": "2025-06-03T09:10:25.565028+00:00"} {"global_step": 236570, "acc_step": 0, "speed/wps": 5496.058559912148, "speed/FLOPS": 242897656970236.12, "speed/curr_iter_time": 2.9802, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9802, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "2.01 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 2.01, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04703289642930031, "optim/lr": 8.623304204703252e-06, "optim/total_tokens": 1984492994560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2429158687591553, "created_at": "2025-06-03T09:10:28.550515+00:00"} {"global_step": 236571, "acc_step": 0, "speed/wps": 5525.0921489903385, "speed/FLOPS": 244180793000111.7, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.050234355032444, "optim/lr": 8.619756979608706e-06, "optim/total_tokens": 1984501383168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.259373426437378, "created_at": "2025-06-03T09:10:31.520234+00:00"} {"global_step": 236572, "acc_step": 0, "speed/wps": 5515.004697252513, "speed/FLOPS": 243734979265558.38, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046310827136039734, "optim/lr": 8.616209754514381e-06, "optim/total_tokens": 1984509771776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2559592723846436, "created_at": "2025-06-03T09:10:34.496029+00:00"} {"global_step": 236573, "acc_step": 0, "speed/wps": 5521.159180518648, "speed/FLOPS": 244006975924420.5, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04651700705289841, "optim/lr": 8.612662529419835e-06, "optim/total_tokens": 1984518160384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2718987464904785, "created_at": "2025-06-03T09:10:37.468551+00:00"} {"global_step": 236574, "acc_step": 0, "speed/wps": 5532.7277405692475, "speed/FLOPS": 244518247065398.84, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.55, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.051522016525268555, "optim/lr": 8.609115304325289e-06, "optim/total_tokens": 1984526548992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2610262632369995, "created_at": "2025-06-03T09:10:40.434729+00:00"} {"global_step": 236575, "acc_step": 0, "speed/wps": 5524.18172034547, "speed/FLOPS": 244140556714004.75, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 194.76, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046124473214149475, "optim/lr": 8.60556807923074e-06, "optim/total_tokens": 1984534937600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.258309006690979, "created_at": "2025-06-03T09:10:43.405290+00:00"} {"global_step": 236576, "acc_step": 0, "speed/wps": 5536.9308645095025, "speed/FLOPS": 244704003630019.53, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.4, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04674132913351059, "optim/lr": 8.602020854136416e-06, "optim/total_tokens": 1984543326208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2631646394729614, "created_at": "2025-06-03T09:10:46.371679+00:00"} {"global_step": 236577, "acc_step": 0, "speed/wps": 5512.620486741989, "speed/FLOPS": 243629609364488.88, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048319604247808456, "optim/lr": 8.59847362904187e-06, "optim/total_tokens": 1984551714816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2567707300186157, "created_at": "2025-06-03T09:10:49.351498+00:00"} {"global_step": 236578, "acc_step": 0, "speed/wps": 5512.52027222141, "speed/FLOPS": 243625180395623.7, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "2.0 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 2.0, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04803149402141571, "optim/lr": 8.594926403947323e-06, "optim/total_tokens": 1984560103424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.263927698135376, "created_at": "2025-06-03T09:10:52.328683+00:00"} {"global_step": 236579, "acc_step": 0, "speed/wps": 5524.045689812159, "speed/FLOPS": 244134544860699.78, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04958786442875862, "optim/lr": 8.591379178852777e-06, "optim/total_tokens": 1984568492032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2862673997879028, "created_at": "2025-06-03T09:10:55.302990+00:00"} {"global_step": 236580, "acc_step": 0, "speed/wps": 5530.607932802479, "speed/FLOPS": 244424562412267.4, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.049642421305179596, "optim/lr": 8.587831953758452e-06, "optim/total_tokens": 1984576880640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2689615488052368, "created_at": "2025-06-03T09:10:58.270077+00:00"} {"global_step": 236581, "acc_step": 0, "speed/wps": 5519.135368921868, "speed/FLOPS": 243917533810649.6, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047546256333589554, "optim/lr": 8.584284728663904e-06, "optim/total_tokens": 1984585269248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2552311420440674, "created_at": "2025-06-03T09:11:01.243040+00:00"} {"global_step": 236582, "acc_step": 0, "speed/wps": 5524.719858210727, "speed/FLOPS": 244164339653209.78, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04806525260210037, "optim/lr": 8.580737503569358e-06, "optim/total_tokens": 1984593657856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2505995035171509, "created_at": "2025-06-03T09:11:04.215042+00:00"} {"global_step": 236583, "acc_step": 0, "speed/wps": 5526.5019025015645, "speed/FLOPS": 244243096889535.25, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05139537900686264, "optim/lr": 8.577190278474811e-06, "optim/total_tokens": 1984602046464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2723612785339355, "created_at": "2025-06-03T09:11:07.183659+00:00"} {"global_step": 236584, "acc_step": 0, "speed/wps": 5521.08821283463, "speed/FLOPS": 244003839516032.44, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04749920964241028, "optim/lr": 8.573643053380487e-06, "optim/total_tokens": 1984610435072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2757185697555542, "created_at": "2025-06-03T09:11:10.156200+00:00"} {"global_step": 236585, "acc_step": 0, "speed/wps": 5527.584363642368, "speed/FLOPS": 244290936131420.4, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04779069870710373, "optim/lr": 8.57009582828594e-06, "optim/total_tokens": 1984618823680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2728453874588013, "created_at": "2025-06-03T09:11:13.124664+00:00"} {"global_step": 236586, "acc_step": 0, "speed/wps": 5512.230537711045, "speed/FLOPS": 243612375613261.22, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04951968416571617, "optim/lr": 8.566548603191392e-06, "optim/total_tokens": 1984627212288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.257338523864746, "created_at": "2025-06-03T09:11:16.101790+00:00"} {"global_step": 236587, "acc_step": 0, "speed/wps": 5509.818546215855, "speed/FLOPS": 243505777934865.47, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047175273299217224, "optim/lr": 8.563001378096846e-06, "optim/total_tokens": 1984635600896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2743889093399048, "created_at": "2025-06-03T09:11:19.079244+00:00"} {"global_step": 236588, "acc_step": 0, "speed/wps": 5518.041887634832, "speed/FLOPS": 243869207534707.22, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04770933464169502, "optim/lr": 8.559454153002522e-06, "optim/total_tokens": 1984643989504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2590532302856445, "created_at": "2025-06-03T09:11:22.052443+00:00"} {"global_step": 236589, "acc_step": 0, "speed/wps": 5500.19232407494, "speed/FLOPS": 243080348187708.5, "speed/curr_iter_time": 2.978, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.978, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.049331799149513245, "optim/lr": 8.555906927907975e-06, "optim/total_tokens": 1984652378112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2700456380844116, "created_at": "2025-06-03T09:11:25.037271+00:00"} {"global_step": 236590, "acc_step": 0, "speed/wps": 5518.923260635922, "speed/FLOPS": 243908159710079.4, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.99 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.99, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04742831364274025, "optim/lr": 8.552359702813429e-06, "optim/total_tokens": 1984660766720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.25408935546875, "created_at": "2025-06-03T09:11:28.009735+00:00"} {"global_step": 236591, "acc_step": 0, "speed/wps": 5525.609924214996, "speed/FLOPS": 244203676014827.7, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05032984912395477, "optim/lr": 8.548812477719103e-06, "optim/total_tokens": 1984669155328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.270521640777588, "created_at": "2025-06-03T09:11:30.978877+00:00"} {"global_step": 236592, "acc_step": 0, "speed/wps": 5523.488145781444, "speed/FLOPS": 244109904268311.2, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04724852740764618, "optim/lr": 8.545265252624556e-06, "optim/total_tokens": 1984677543936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2720372676849365, "created_at": "2025-06-03T09:11:33.949735+00:00"} {"global_step": 236593, "acc_step": 0, "speed/wps": 5521.598529658932, "speed/FLOPS": 244026392907628.3, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046484075486660004, "optim/lr": 8.54171802753001e-06, "optim/total_tokens": 1984685932544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.277334213256836, "created_at": "2025-06-03T09:11:36.921194+00:00"} {"global_step": 236594, "acc_step": 0, "speed/wps": 5522.967725965427, "speed/FLOPS": 244086904376193.38, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04735667258501053, "optim/lr": 8.538170802435463e-06, "optim/total_tokens": 1984694321152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.279543161392212, "created_at": "2025-06-03T09:11:39.892267+00:00"} {"global_step": 236595, "acc_step": 0, "speed/wps": 5514.9505933263445, "speed/FLOPS": 243732588148950.72, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04710099846124649, "optim/lr": 8.534623577341139e-06, "optim/total_tokens": 1984702709760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2621796131134033, "created_at": "2025-06-03T09:11:42.868447+00:00"} {"global_step": 236596, "acc_step": 0, "speed/wps": 5528.751446543277, "speed/FLOPS": 244342515221968.75, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047329131513834, "optim/lr": 8.531076352246591e-06, "optim/total_tokens": 1984711098368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2660844326019287, "created_at": "2025-06-03T09:11:45.839968+00:00"} {"global_step": 236597, "acc_step": 0, "speed/wps": 5520.263433924028, "speed/FLOPS": 243967388509784.97, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04744860902428627, "optim/lr": 8.527529127152045e-06, "optim/total_tokens": 1984719486976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2666466236114502, "created_at": "2025-06-03T09:11:48.812749+00:00"} {"global_step": 236598, "acc_step": 0, "speed/wps": 5515.907287977205, "speed/FLOPS": 243774869155711.6, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.98 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.98, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04671241715550423, "optim/lr": 8.523981902057498e-06, "optim/total_tokens": 1984727875584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2695657014846802, "created_at": "2025-06-03T09:11:51.787693+00:00"} {"global_step": 236599, "acc_step": 0, "speed/wps": 5538.164058133458, "speed/FLOPS": 244758504476141.2, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.38, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04774245247244835, "optim/lr": 8.520434676963174e-06, "optim/total_tokens": 1984736264192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2567172050476074, "created_at": "2025-06-03T09:11:54.750093+00:00"} {"global_step": 236600, "acc_step": 0, "speed/wps": 5541.09123166845, "speed/FLOPS": 244887870563755.47, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.27, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04735874757170677, "optim/lr": 8.516887451868627e-06, "optim/total_tokens": 1984744652800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2591828107833862, "created_at": "2025-06-03T09:11:57.714492+00:00"} {"global_step": 236601, "acc_step": 0, "speed/wps": 5536.120472605018, "speed/FLOPS": 244668188455803.12, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04757479578256607, "optim/lr": 8.513340226774081e-06, "optim/total_tokens": 1984753041408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2710843086242676, "created_at": "2025-06-03T09:12:00.681327+00:00"} {"global_step": 236602, "acc_step": 0, "speed/wps": 5525.091282672519, "speed/FLOPS": 244180754713298.25, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04662551358342171, "optim/lr": 8.509793001679533e-06, "optim/total_tokens": 1984761430016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2527341842651367, "created_at": "2025-06-03T09:12:03.650654+00:00"} {"global_step": 236603, "acc_step": 0, "speed/wps": 5530.299547611326, "speed/FLOPS": 244410933365276.94, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0462416373193264, "optim/lr": 8.506245776585208e-06, "optim/total_tokens": 1984769818624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.266495943069458, "created_at": "2025-06-03T09:12:06.619965+00:00"} {"global_step": 236604, "acc_step": 0, "speed/wps": 5529.369545757403, "speed/FLOPS": 244369832043514.56, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046968843787908554, "optim/lr": 8.502698551490662e-06, "optim/total_tokens": 1984778207232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2608262300491333, "created_at": "2025-06-03T09:12:09.588256+00:00"} {"global_step": 236605, "acc_step": 0, "speed/wps": 5530.248474534563, "speed/FLOPS": 244408676196699.72, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.57, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046926308423280716, "optim/lr": 8.499151326396116e-06, "optim/total_tokens": 1984786595840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2691020965576172, "created_at": "2025-06-03T09:12:12.558336+00:00"} {"global_step": 236606, "acc_step": 0, "speed/wps": 5532.313259280261, "speed/FLOPS": 244499929113933.2, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04789497330784798, "optim/lr": 8.495604101301569e-06, "optim/total_tokens": 1984794984448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2702809572219849, "created_at": "2025-06-03T09:12:15.525338+00:00"} {"global_step": 236607, "acc_step": 0, "speed/wps": 5533.1628748279745, "speed/FLOPS": 244537477772415.53, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04695599153637886, "optim/lr": 8.492056876207243e-06, "optim/total_tokens": 1984803373056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2682732343673706, "created_at": "2025-06-03T09:12:18.490303+00:00"} {"global_step": 236608, "acc_step": 0, "speed/wps": 5540.49954949565, "speed/FLOPS": 244861721240221.62, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 194.23, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04639291390776634, "optim/lr": 8.488509651112697e-06, "optim/total_tokens": 1984811761664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.281567096710205, "created_at": "2025-06-03T09:12:21.457098+00:00"} {"global_step": 236609, "acc_step": 0, "speed/wps": 5517.727835624032, "speed/FLOPS": 243855328043293.78, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04849591106176376, "optim/lr": 8.48496242601815e-06, "optim/total_tokens": 1984820150272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2587754726409912, "created_at": "2025-06-03T09:12:24.431219+00:00"} {"global_step": 236610, "acc_step": 0, "speed/wps": 5524.933211764627, "speed/FLOPS": 244173768788249.7, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04700647294521332, "optim/lr": 8.481415200923604e-06, "optim/total_tokens": 1984828538880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2609825134277344, "created_at": "2025-06-03T09:12:27.402158+00:00"} {"global_step": 236611, "acc_step": 0, "speed/wps": 5521.876516275214, "speed/FLOPS": 244038678493203.47, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046393513679504395, "optim/lr": 8.47786797582928e-06, "optim/total_tokens": 1984836927488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.263354778289795, "created_at": "2025-06-03T09:12:30.377472+00:00"} {"global_step": 236612, "acc_step": 0, "speed/wps": 5522.317567474451, "speed/FLOPS": 244058170698705.03, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04683142527937889, "optim/lr": 8.474320750734731e-06, "optim/total_tokens": 1984845316096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.276736855506897, "created_at": "2025-06-03T09:12:33.351125+00:00"} {"global_step": 236613, "acc_step": 0, "speed/wps": 5525.736220189925, "speed/FLOPS": 244209257650478.16, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0483514778316021, "optim/lr": 8.470773525640185e-06, "optim/total_tokens": 1984853704704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.266128659248352, "created_at": "2025-06-03T09:12:36.321287+00:00"} {"global_step": 236614, "acc_step": 0, "speed/wps": 5517.478318890312, "speed/FLOPS": 243844300680805.78, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047763071954250336, "optim/lr": 8.467226300545638e-06, "optim/total_tokens": 1984862093312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2636667490005493, "created_at": "2025-06-03T09:12:39.298705+00:00"} {"global_step": 236615, "acc_step": 0, "speed/wps": 5512.821090398972, "speed/FLOPS": 243638475019344.9, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.97 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.97, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047315239906311035, "optim/lr": 8.463679075451314e-06, "optim/total_tokens": 1984870481920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2694263458251953, "created_at": "2025-06-03T09:12:42.281283+00:00"} {"global_step": 236616, "acc_step": 0, "speed/wps": 5534.156458508494, "speed/FLOPS": 244581389085472.22, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04653055965900421, "optim/lr": 8.460131850356768e-06, "optim/total_tokens": 1984878870528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2477961778640747, "created_at": "2025-06-03T09:12:45.247945+00:00"} {"global_step": 236617, "acc_step": 0, "speed/wps": 5527.052931269759, "speed/FLOPS": 244267449540668.56, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04637860506772995, "optim/lr": 8.45658462526222e-06, "optim/total_tokens": 1984887259136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2626347541809082, "created_at": "2025-06-03T09:12:48.220894+00:00"} {"global_step": 236618, "acc_step": 0, "speed/wps": 5520.908339780225, "speed/FLOPS": 243995890047701.5, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04625677317380905, "optim/lr": 8.453037400167673e-06, "optim/total_tokens": 1984895647744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2791780233383179, "created_at": "2025-06-03T09:12:51.193366+00:00"} {"global_step": 236619, "acc_step": 0, "speed/wps": 5531.910322662737, "speed/FLOPS": 244482121377855.2, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04714882746338844, "optim/lr": 8.449490175073349e-06, "optim/total_tokens": 1984904036352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2724313735961914, "created_at": "2025-06-03T09:12:54.159168+00:00"} {"global_step": 236620, "acc_step": 0, "speed/wps": 5520.5229467597555, "speed/FLOPS": 243978857648817.03, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 195.01, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04844576492905617, "optim/lr": 8.445942949978802e-06, "optim/total_tokens": 1984912424960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2525631189346313, "created_at": "2025-06-03T09:12:57.131478+00:00"} {"global_step": 236621, "acc_step": 0, "speed/wps": 5514.47118960675, "speed/FLOPS": 243711400958355.3, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04767328128218651, "optim/lr": 8.442395724884256e-06, "optim/total_tokens": 1984920813568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.262821912765503, "created_at": "2025-06-03T09:13:00.109584+00:00"} {"global_step": 236622, "acc_step": 0, "speed/wps": 5510.547392826798, "speed/FLOPS": 243537989224494.0, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05004466697573662, "optim/lr": 8.438848499789931e-06, "optim/total_tokens": 1984929202176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2557088136672974, "created_at": "2025-06-03T09:13:03.086622+00:00"} {"global_step": 236623, "acc_step": 0, "speed/wps": 5518.512324664154, "speed/FLOPS": 243889998443488.28, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05432809516787529, "optim/lr": 8.435301274695383e-06, "optim/total_tokens": 1984937590784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2441991567611694, "created_at": "2025-06-03T09:13:06.059794+00:00"} {"global_step": 236624, "acc_step": 0, "speed/wps": 5535.041471290613, "speed/FLOPS": 244620502120535.78, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.5, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04707007110118866, "optim/lr": 8.431754049600837e-06, "optim/total_tokens": 1984945979392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2753374576568604, "created_at": "2025-06-03T09:13:09.025242+00:00"} {"global_step": 236625, "acc_step": 0, "speed/wps": 5539.579745836399, "speed/FLOPS": 244821070626464.62, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04659099131822586, "optim/lr": 8.42820682450629e-06, "optim/total_tokens": 1984954368000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2718514204025269, "created_at": "2025-06-03T09:13:11.987081+00:00"} {"global_step": 236626, "acc_step": 0, "speed/wps": 5532.546893867343, "speed/FLOPS": 244510254566832.0, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04749947786331177, "optim/lr": 8.424659599411966e-06, "optim/total_tokens": 1984962756608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.28094482421875, "created_at": "2025-06-03T09:13:14.952679+00:00"} {"global_step": 236627, "acc_step": 0, "speed/wps": 5521.952841818313, "speed/FLOPS": 244042051691538.88, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.96 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.96, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04681184142827988, "optim/lr": 8.42111237431742e-06, "optim/total_tokens": 1984971145216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.258318305015564, "created_at": "2025-06-03T09:13:17.923820+00:00"} {"global_step": 236628, "acc_step": 0, "speed/wps": 5525.856671257261, "speed/FLOPS": 244214580971129.94, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04871978610754013, "optim/lr": 8.417565149222872e-06, "optim/total_tokens": 1984979533824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.260542631149292, "created_at": "2025-06-03T09:13:20.892990+00:00"} {"global_step": 236629, "acc_step": 0, "speed/wps": 5521.638413378467, "speed/FLOPS": 244028155563888.34, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048226337879896164, "optim/lr": 8.414017924128325e-06, "optim/total_tokens": 1984987922432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2712817192077637, "created_at": "2025-06-03T09:13:23.864722+00:00"} {"global_step": 236630, "acc_step": 0, "speed/wps": 5518.322571863913, "speed/FLOPS": 243881612340960.5, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04679710417985916, "optim/lr": 8.410470699034e-06, "optim/total_tokens": 1984996311040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2542047500610352, "created_at": "2025-06-03T09:13:26.839792+00:00"} {"global_step": 236631, "acc_step": 0, "speed/wps": 5516.893121794732, "speed/FLOPS": 243818437964491.4, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04738842323422432, "optim/lr": 8.406923473939454e-06, "optim/total_tokens": 1985004699648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.260730504989624, "created_at": "2025-06-03T09:13:29.817016+00:00"} {"global_step": 236632, "acc_step": 0, "speed/wps": 5525.531226185626, "speed/FLOPS": 244200197964742.56, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.8, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046895381063222885, "optim/lr": 8.403376248844908e-06, "optim/total_tokens": 1985013088256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2746949195861816, "created_at": "2025-06-03T09:13:32.786557+00:00"} {"global_step": 236633, "acc_step": 0, "speed/wps": 5542.8262842242675, "speed/FLOPS": 244964551005918.56, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 194.24, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05086367949843407, "optim/lr": 8.39982902375036e-06, "optim/total_tokens": 1985021476864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2688627243041992, "created_at": "2025-06-03T09:13:35.747560+00:00"} {"global_step": 236634, "acc_step": 0, "speed/wps": 5532.362279686324, "speed/FLOPS": 244502095564971.97, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04614190012216568, "optim/lr": 8.396281798656035e-06, "optim/total_tokens": 1985029865472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.269105076789856, "created_at": "2025-06-03T09:13:38.715519+00:00"} {"global_step": 236635, "acc_step": 0, "speed/wps": 5527.118732568235, "speed/FLOPS": 244270357621259.6, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.72, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04873128980398178, "optim/lr": 8.392734573561489e-06, "optim/total_tokens": 1985038254080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2690627574920654, "created_at": "2025-06-03T09:13:41.685426+00:00"} {"global_step": 236636, "acc_step": 0, "speed/wps": 5528.685137674124, "speed/FLOPS": 244339584709351.78, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 194.74, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0462416373193264, "optim/lr": 8.389187348466943e-06, "optim/total_tokens": 1985046642688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2783912420272827, "created_at": "2025-06-03T09:13:44.655080+00:00"} {"global_step": 236637, "acc_step": 0, "speed/wps": 5514.237853680516, "speed/FLOPS": 243701088704737.3, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04634131118655205, "optim/lr": 8.385640123372396e-06, "optim/total_tokens": 1985055031296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2501552104949951, "created_at": "2025-06-03T09:13:47.633219+00:00"} {"global_step": 236638, "acc_step": 0, "speed/wps": 5529.062101049428, "speed/FLOPS": 244356244561066.72, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04959674924612045, "optim/lr": 8.382092898278072e-06, "optim/total_tokens": 1985063419904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2619229555130005, "created_at": "2025-06-03T09:13:50.601132+00:00"} {"global_step": 236639, "acc_step": 0, "speed/wps": 5521.3255162141995, "speed/FLOPS": 244014327110780.6, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04779856279492378, "optim/lr": 8.378545673183524e-06, "optim/total_tokens": 1985071808512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.264795184135437, "created_at": "2025-06-03T09:13:53.573284+00:00"} {"global_step": 236640, "acc_step": 0, "speed/wps": 5518.688505607317, "speed/FLOPS": 243897784739400.25, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.95 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.95, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04668539762496948, "optim/lr": 8.374998448088977e-06, "optim/total_tokens": 1985080197120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2711509466171265, "created_at": "2025-06-03T09:13:56.550986+00:00"} {"global_step": 236641, "acc_step": 0, "speed/wps": 5535.244933144016, "speed/FLOPS": 244629494093044.0, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 194.51, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04953496903181076, "optim/lr": 8.37145122299443e-06, "optim/total_tokens": 1985088585728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.244621992111206, "created_at": "2025-06-03T09:13:59.514785+00:00"} {"global_step": 236642, "acc_step": 0, "speed/wps": 5527.436486071946, "speed/FLOPS": 244284400699713.78, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 194.72, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048846978694200516, "optim/lr": 8.367903997900106e-06, "optim/total_tokens": 1985096974336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.269859790802002, "created_at": "2025-06-03T09:14:02.489216+00:00"} {"global_step": 236643, "acc_step": 0, "speed/wps": 5516.755908108545, "speed/FLOPS": 243812373821885.22, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05011318624019623, "optim/lr": 8.36435677280556e-06, "optim/total_tokens": 1985105362944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.267662525177002, "created_at": "2025-06-03T09:14:05.464303+00:00"} {"global_step": 236644, "acc_step": 0, "speed/wps": 5517.125188435091, "speed/FLOPS": 243828694122170.53, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04899517446756363, "optim/lr": 8.360809547711012e-06, "optim/total_tokens": 1985113751552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.275444746017456, "created_at": "2025-06-03T09:14:08.438028+00:00"} {"global_step": 236645, "acc_step": 0, "speed/wps": 5523.650449028855, "speed/FLOPS": 244117077241103.47, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04656437784433365, "optim/lr": 8.357262322616465e-06, "optim/total_tokens": 1985122140160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2562685012817383, "created_at": "2025-06-03T09:14:11.413043+00:00"} {"global_step": 236646, "acc_step": 0, "speed/wps": 5516.1257309581615, "speed/FLOPS": 243784523217377.34, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04705674201250076, "optim/lr": 8.353715097522141e-06, "optim/total_tokens": 1985130528768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2697272300720215, "created_at": "2025-06-03T09:14:14.388082+00:00"} {"global_step": 236647, "acc_step": 0, "speed/wps": 5521.546729862657, "speed/FLOPS": 244024103621768.34, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.1008540466427803, "optim/lr": 8.350167872427595e-06, "optim/total_tokens": 1985138917376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.255212426185608, "created_at": "2025-06-03T09:14:17.363758+00:00"} {"global_step": 236648, "acc_step": 0, "speed/wps": 5516.936418997742, "speed/FLOPS": 243820351479249.28, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046992987394332886, "optim/lr": 8.346620647333048e-06, "optim/total_tokens": 1985147305984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2431960105895996, "created_at": "2025-06-03T09:14:20.342939+00:00"} {"global_step": 236649, "acc_step": 0, "speed/wps": 5516.086489817042, "speed/FLOPS": 243782788959794.25, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.052268195897340775, "optim/lr": 8.343073422238722e-06, "optim/total_tokens": 1985155694592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2517752647399902, "created_at": "2025-06-03T09:14:23.317549+00:00"} {"global_step": 236650, "acc_step": 0, "speed/wps": 5532.148657301421, "speed/FLOPS": 244492654548977.75, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04869053140282631, "optim/lr": 8.339526197144176e-06, "optim/total_tokens": 1985164083200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.254024863243103, "created_at": "2025-06-03T09:14:26.283662+00:00"} {"global_step": 236651, "acc_step": 0, "speed/wps": 5538.516536127184, "speed/FLOPS": 244774082199317.97, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 194.41, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04676585644483566, "optim/lr": 8.33597897204963e-06, "optim/total_tokens": 1985172471808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2764183282852173, "created_at": "2025-06-03T09:14:29.250814+00:00"} {"global_step": 236652, "acc_step": 0, "speed/wps": 5519.573162993376, "speed/FLOPS": 243936882067777.1, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04991207644343376, "optim/lr": 8.332431746955083e-06, "optim/total_tokens": 1985180860416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2764250040054321, "created_at": "2025-06-03T09:14:32.227974+00:00"} {"global_step": 236653, "acc_step": 0, "speed/wps": 5506.995445137014, "speed/FLOPS": 243381011317121.94, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05025020241737366, "optim/lr": 8.328884521860758e-06, "optim/total_tokens": 1985189249024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2645195722579956, "created_at": "2025-06-03T09:14:35.212867+00:00"} {"global_step": 236654, "acc_step": 0, "speed/wps": 5505.6937485448525, "speed/FLOPS": 243323482990435.53, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.94 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.94, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04681551083922386, "optim/lr": 8.325337296766212e-06, "optim/total_tokens": 1985197637632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2496944665908813, "created_at": "2025-06-03T09:14:38.198005+00:00"} {"global_step": 236655, "acc_step": 0, "speed/wps": 5522.733901489359, "speed/FLOPS": 244076570531173.3, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05262180045247078, "optim/lr": 8.321790071671664e-06, "optim/total_tokens": 1985206026240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2621101140975952, "created_at": "2025-06-03T09:14:41.172971+00:00"} {"global_step": 236656, "acc_step": 0, "speed/wps": 5520.758630154949, "speed/FLOPS": 243989273648547.62, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05299948528409004, "optim/lr": 8.318242846577117e-06, "optim/total_tokens": 1985214414848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2692357301712036, "created_at": "2025-06-03T09:14:44.148334+00:00"} {"global_step": 236657, "acc_step": 0, "speed/wps": 5530.277583782241, "speed/FLOPS": 244409962676452.47, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04857796058058739, "optim/lr": 8.314695621482793e-06, "optim/total_tokens": 1985222803456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2697224617004395, "created_at": "2025-06-03T09:14:47.115120+00:00"} {"global_step": 236658, "acc_step": 0, "speed/wps": 5531.880593050782, "speed/FLOPS": 244480807481176.75, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 194.64, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0555119626224041, "optim/lr": 8.311148396388247e-06, "optim/total_tokens": 1985231192064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.273492693901062, "created_at": "2025-06-03T09:14:50.085684+00:00"} {"global_step": 236659, "acc_step": 0, "speed/wps": 5531.1261019993035, "speed/FLOPS": 244447462838536.66, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.052853070199489594, "optim/lr": 8.3076011712937e-06, "optim/total_tokens": 1985239580672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2756799459457397, "created_at": "2025-06-03T09:14:53.057030+00:00"} {"global_step": 236660, "acc_step": 0, "speed/wps": 5513.987456516737, "speed/FLOPS": 243690022431747.16, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04674083739519119, "optim/lr": 8.304053946199152e-06, "optim/total_tokens": 1985247969280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2711905241012573, "created_at": "2025-06-03T09:14:56.032571+00:00"} {"global_step": 236661, "acc_step": 0, "speed/wps": 5518.637771409033, "speed/FLOPS": 243895542547517.28, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047874290496110916, "optim/lr": 8.300506721104828e-06, "optim/total_tokens": 1985256357888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2665754556655884, "created_at": "2025-06-03T09:14:59.007082+00:00"} {"global_step": 236662, "acc_step": 0, "speed/wps": 5518.885944322561, "speed/FLOPS": 243906510520031.06, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.053397681564092636, "optim/lr": 8.296959496010281e-06, "optim/total_tokens": 1985264746496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2692275047302246, "created_at": "2025-06-03T09:15:01.981168+00:00"} {"global_step": 236663, "acc_step": 0, "speed/wps": 5509.456048102448, "speed/FLOPS": 243489757373686.4, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05390793830156326, "optim/lr": 8.293412270915735e-06, "optim/total_tokens": 1985273135104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2663805484771729, "created_at": "2025-06-03T09:15:04.959345+00:00"} {"global_step": 236664, "acc_step": 0, "speed/wps": 5516.688469388075, "speed/FLOPS": 243809393375623.12, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05230134353041649, "optim/lr": 8.289865045821188e-06, "optim/total_tokens": 1985281523712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2730205059051514, "created_at": "2025-06-03T09:15:07.937293+00:00"} {"global_step": 236665, "acc_step": 0, "speed/wps": 5507.125011470356, "speed/FLOPS": 243386737485875.03, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.93 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.93, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05854038894176483, "optim/lr": 8.286317820726862e-06, "optim/total_tokens": 1985289912320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2674399614334106, "created_at": "2025-06-03T09:15:10.919523+00:00"} {"global_step": 236666, "acc_step": 0, "speed/wps": 5520.455615126926, "speed/FLOPS": 243975881935280.5, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04749678447842598, "optim/lr": 8.282770595632316e-06, "optim/total_tokens": 1985298300928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2683273553848267, "created_at": "2025-06-03T09:15:13.891732+00:00"} {"global_step": 236667, "acc_step": 0, "speed/wps": 5523.122502096164, "speed/FLOPS": 244093744688955.88, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04870330169796944, "optim/lr": 8.27922337053777e-06, "optim/total_tokens": 1985306689536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2432689666748047, "created_at": "2025-06-03T09:15:16.867590+00:00"} {"global_step": 236668, "acc_step": 0, "speed/wps": 5516.3004523089, "speed/FLOPS": 243792245006775.06, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05139528587460518, "optim/lr": 8.275676145443223e-06, "optim/total_tokens": 1985315078144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.267686367034912, "created_at": "2025-06-03T09:15:19.845173+00:00"} {"global_step": 236669, "acc_step": 0, "speed/wps": 5519.152105210549, "speed/FLOPS": 243918273468945.22, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.01, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05297393724322319, "optim/lr": 8.272128920348899e-06, "optim/total_tokens": 1985323466752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.265166997909546, "created_at": "2025-06-03T09:15:22.820944+00:00"} {"global_step": 236670, "acc_step": 0, "speed/wps": 5518.807203549296, "speed/FLOPS": 243903030580884.56, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046669092029333115, "optim/lr": 8.26858169525435e-06, "optim/total_tokens": 1985331855360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2508293390274048, "created_at": "2025-06-03T09:15:25.794076+00:00"} {"global_step": 236671, "acc_step": 0, "speed/wps": 5517.066706142526, "speed/FLOPS": 243826109504178.66, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.049885738641023636, "optim/lr": 8.265034470159804e-06, "optim/total_tokens": 1985340243968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2628380060195923, "created_at": "2025-06-03T09:15:28.768238+00:00"} {"global_step": 236672, "acc_step": 0, "speed/wps": 5515.911934213758, "speed/FLOPS": 243775074495585.7, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05329975485801697, "optim/lr": 8.261487245065258e-06, "optim/total_tokens": 1985348632576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2605773210525513, "created_at": "2025-06-03T09:15:31.743229+00:00"} {"global_step": 236673, "acc_step": 0, "speed/wps": 5515.345687149809, "speed/FLOPS": 243750049273674.34, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04746653884649277, "optim/lr": 8.257940019970933e-06, "optim/total_tokens": 1985357021184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.272376298904419, "created_at": "2025-06-03T09:15:34.721136+00:00"} {"global_step": 236674, "acc_step": 0, "speed/wps": 5519.629611605467, "speed/FLOPS": 243939376807501.3, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05103905126452446, "optim/lr": 8.254392794876387e-06, "optim/total_tokens": 1985365409792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2656103372573853, "created_at": "2025-06-03T09:15:37.694001+00:00"} {"global_step": 236675, "acc_step": 0, "speed/wps": 5525.337559959967, "speed/FLOPS": 244191638908842.03, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048047490417957306, "optim/lr": 8.250845569781839e-06, "optim/total_tokens": 1985373798400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2531386613845825, "created_at": "2025-06-03T09:15:40.663647+00:00"} {"global_step": 236676, "acc_step": 0, "speed/wps": 5528.101347117292, "speed/FLOPS": 244313784154850.72, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04723940044641495, "optim/lr": 8.247298344687514e-06, "optim/total_tokens": 1985382187008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2568459510803223, "created_at": "2025-06-03T09:15:43.632531+00:00"} {"global_step": 236677, "acc_step": 0, "speed/wps": 5531.38116438697, "speed/FLOPS": 244458735290543.9, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.049771998077631, "optim/lr": 8.243751119592968e-06, "optim/total_tokens": 1985390575616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.270405650138855, "created_at": "2025-06-03T09:15:46.600395+00:00"} {"global_step": 236678, "acc_step": 0, "speed/wps": 5516.096768769669, "speed/FLOPS": 243783243236887.9, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.92 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.92, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047314394265413284, "optim/lr": 8.240203894498422e-06, "optim/total_tokens": 1985398964224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2675342559814453, "created_at": "2025-06-03T09:15:49.574874+00:00"} {"global_step": 236679, "acc_step": 0, "speed/wps": 5519.726708066667, "speed/FLOPS": 243943667974101.6, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04832761362195015, "optim/lr": 8.236656669403875e-06, "optim/total_tokens": 1985407352832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2539678812026978, "created_at": "2025-06-03T09:15:52.547410+00:00"} {"global_step": 236680, "acc_step": 0, "speed/wps": 5515.728610536351, "speed/FLOPS": 243766972527379.9, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047035545110702515, "optim/lr": 8.23310944430955e-06, "optim/total_tokens": 1985415741440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2590069770812988, "created_at": "2025-06-03T09:15:55.525203+00:00"} {"global_step": 236681, "acc_step": 0, "speed/wps": 5513.616452895278, "speed/FLOPS": 243673625970647.3, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.31, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04900740459561348, "optim/lr": 8.229562219215003e-06, "optim/total_tokens": 1985424130048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2758413553237915, "created_at": "2025-06-03T09:15:58.501509+00:00"} {"global_step": 236682, "acc_step": 0, "speed/wps": 5516.795058865393, "speed/FLOPS": 243814104084946.2, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.050400376319885254, "optim/lr": 8.226014994120456e-06, "optim/total_tokens": 1985432518656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2647432088851929, "created_at": "2025-06-03T09:16:01.480154+00:00"} {"global_step": 236683, "acc_step": 0, "speed/wps": 5525.193076658864, "speed/FLOPS": 244185253486465.84, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04645164683461189, "optim/lr": 8.22246776902591e-06, "optim/total_tokens": 1985440907264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.252708911895752, "created_at": "2025-06-03T09:16:04.451099+00:00"} {"global_step": 236684, "acc_step": 0, "speed/wps": 5521.165076705448, "speed/FLOPS": 244007236505697.62, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05003290995955467, "optim/lr": 8.218920543931585e-06, "optim/total_tokens": 1985449295872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2616552114486694, "created_at": "2025-06-03T09:16:07.423318+00:00"} {"global_step": 236685, "acc_step": 0, "speed/wps": 5522.416934143241, "speed/FLOPS": 244062562196860.84, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048385221511125565, "optim/lr": 8.215373318837039e-06, "optim/total_tokens": 1985457684480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2505466938018799, "created_at": "2025-06-03T09:16:10.394389+00:00"} {"global_step": 236686, "acc_step": 0, "speed/wps": 5528.256208294652, "speed/FLOPS": 244320628226238.72, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047697704285383224, "optim/lr": 8.211826093742491e-06, "optim/total_tokens": 1985466073088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2766135931015015, "created_at": "2025-06-03T09:16:13.364704+00:00"} {"global_step": 236687, "acc_step": 0, "speed/wps": 5516.946858992233, "speed/FLOPS": 243820812873569.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04874226823449135, "optim/lr": 8.208278868647944e-06, "optim/total_tokens": 1985474461696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2589740753173828, "created_at": "2025-06-03T09:16:16.341881+00:00"} {"global_step": 236688, "acc_step": 0, "speed/wps": 5519.3033584552895, "speed/FLOPS": 243924958088178.47, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047221917659044266, "optim/lr": 8.20473164355362e-06, "optim/total_tokens": 1985482850304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2678310871124268, "created_at": "2025-06-03T09:16:19.314473+00:00"} {"global_step": 236689, "acc_step": 0, "speed/wps": 5516.594088049682, "speed/FLOPS": 243805222203553.66, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04742572456598282, "optim/lr": 8.201184418459074e-06, "optim/total_tokens": 1985491238912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2679784297943115, "created_at": "2025-06-03T09:16:22.288699+00:00"} {"global_step": 236690, "acc_step": 0, "speed/wps": 5520.500368875168, "speed/FLOPS": 243977859821882.34, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047328926622867584, "optim/lr": 8.197637193364527e-06, "optim/total_tokens": 1985499627520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2539454698562622, "created_at": "2025-06-03T09:16:25.261918+00:00"} {"global_step": 236691, "acc_step": 0, "speed/wps": 5506.830507822487, "speed/FLOPS": 243373721932045.53, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.91 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.91, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04742981866002083, "optim/lr": 8.194089968269979e-06, "optim/total_tokens": 1985508016128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2644332647323608, "created_at": "2025-06-03T09:16:28.241314+00:00"} {"global_step": 236692, "acc_step": 0, "speed/wps": 5529.581733444475, "speed/FLOPS": 244379209653208.1, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04713073745369911, "optim/lr": 8.190542743175655e-06, "optim/total_tokens": 1985516404736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.261157751083374, "created_at": "2025-06-03T09:16:31.208890+00:00"} {"global_step": 236693, "acc_step": 0, "speed/wps": 5526.310274868037, "speed/FLOPS": 244234627928972.47, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047249939292669296, "optim/lr": 8.186995518081108e-06, "optim/total_tokens": 1985524793344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2780052423477173, "created_at": "2025-06-03T09:16:34.183469+00:00"} {"global_step": 236694, "acc_step": 0, "speed/wps": 5521.893252726936, "speed/FLOPS": 244039418158704.66, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04775812104344368, "optim/lr": 8.183448292986562e-06, "optim/total_tokens": 1985533181952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2599685192108154, "created_at": "2025-06-03T09:16:37.157488+00:00"} {"global_step": 236695, "acc_step": 0, "speed/wps": 5512.879547500613, "speed/FLOPS": 243641058524026.88, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046201273798942566, "optim/lr": 8.179901067892015e-06, "optim/total_tokens": 1985541570560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2545578479766846, "created_at": "2025-06-03T09:16:40.136607+00:00"} {"global_step": 236696, "acc_step": 0, "speed/wps": 5515.95226505195, "speed/FLOPS": 243776856912201.8, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046518195420503616, "optim/lr": 8.176353842797691e-06, "optim/total_tokens": 1985549959168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2628217935562134, "created_at": "2025-06-03T09:16:43.111548+00:00"} {"global_step": 236697, "acc_step": 0, "speed/wps": 5520.19468001883, "speed/FLOPS": 243964349939089.6, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04719431698322296, "optim/lr": 8.172806617703143e-06, "optim/total_tokens": 1985558347776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2667704820632935, "created_at": "2025-06-03T09:16:46.086841+00:00"} {"global_step": 236698, "acc_step": 0, "speed/wps": 5515.750096648746, "speed/FLOPS": 243767922103571.88, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04773464426398277, "optim/lr": 8.169259392608597e-06, "optim/total_tokens": 1985566736384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2686647176742554, "created_at": "2025-06-03T09:16:49.066503+00:00"} {"global_step": 236699, "acc_step": 0, "speed/wps": 5517.435255009143, "speed/FLOPS": 243842397477679.0, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.9 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.9, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04756586253643036, "optim/lr": 8.16571216751405e-06, "optim/total_tokens": 1985575124992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.255104422569275, "created_at": "2025-06-03T09:16:52.044109+00:00"} {"global_step": 236700, "acc_step": 0, "speed/wps": 5538.048634813248, "speed/FLOPS": 244753403356178.03, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.89 hours", "speed/est_time_elapsed_hrs": 194.46, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.89, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048267558217048645, "optim/lr": 8.162164942419726e-06, "optim/total_tokens": 1985583513600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2755012512207031, "created_at": "2025-06-03T09:16:55.007305+00:00"} {"global_step": 236701, "acc_step": 0, "speed/wps": 243.7918406366569, "speed/FLOPS": 10774351516380.443, "speed/curr_iter_time": 2.8863, "speed/data_load_time": 0.0018, "speed/curr_step_time": 2.8863, "speed/est_time_elapsed": "7.91 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 189.78, "speed/est_time_elapsed_days": 7.91, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046946339309215546, "optim/lr": 8.15861771732518e-06, "optim/total_tokens": 1985591902208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.261470913887024, "created_at": "2025-06-03T09:18:02.219550+00:00"} {"global_step": 236702, "acc_step": 0, "speed/wps": 5583.108135370911, "speed/FLOPS": 246744802645395.28, "speed/curr_iter_time": 2.9334, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9334, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 192.87, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05055492743849754, "optim/lr": 8.155070492230631e-06, "optim/total_tokens": 1985600290816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2642894983291626, "created_at": "2025-06-03T09:18:05.162847+00:00"} {"global_step": 236703, "acc_step": 0, "speed/wps": 5570.993722921022, "speed/FLOPS": 246209407622294.16, "speed/curr_iter_time": 2.9399, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9399, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04706196486949921, "optim/lr": 8.151523267136307e-06, "optim/total_tokens": 1985608679424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2581485509872437, "created_at": "2025-06-03T09:18:08.108738+00:00"} {"global_step": 236704, "acc_step": 0, "speed/wps": 5572.05619854305, "speed/FLOPS": 246256363606544.6, "speed/curr_iter_time": 2.9394, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9394, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 193.27, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048725444823503494, "optim/lr": 8.14797604204176e-06, "optim/total_tokens": 1985617068032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.267944097518921, "created_at": "2025-06-03T09:18:11.057378+00:00"} {"global_step": 236705, "acc_step": 0, "speed/wps": 5558.010203776897, "speed/FLOPS": 245635602531799.16, "speed/curr_iter_time": 2.9455, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9455, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 193.67, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04898877814412117, "optim/lr": 8.144428816947214e-06, "optim/total_tokens": 1985625456640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2588485479354858, "created_at": "2025-06-03T09:18:14.010746+00:00"} {"global_step": 236706, "acc_step": 0, "speed/wps": 5542.713329633331, "speed/FLOPS": 244959558991153.2, "speed/curr_iter_time": 2.955, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.955, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.3, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046206116676330566, "optim/lr": 8.140881591852668e-06, "optim/total_tokens": 1985633845248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2508411407470703, "created_at": "2025-06-03T09:18:16.972802+00:00"} {"global_step": 236707, "acc_step": 0, "speed/wps": 5539.234447391631, "speed/FLOPS": 244805810202603.56, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.42, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04686490818858147, "optim/lr": 8.137334366758341e-06, "optim/total_tokens": 1985642233856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2525607347488403, "created_at": "2025-06-03T09:18:19.938848+00:00"} {"global_step": 236708, "acc_step": 0, "speed/wps": 5542.837857614679, "speed/FLOPS": 244965062490536.75, "speed/curr_iter_time": 2.9535, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9535, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.09696295112371445, "optim/lr": 8.133787141663795e-06, "optim/total_tokens": 1985650622464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.256441354751587, "created_at": "2025-06-03T09:18:22.902833+00:00"} {"global_step": 236709, "acc_step": 0, "speed/wps": 5536.573099125539, "speed/FLOPS": 244688192231257.56, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04679381474852562, "optim/lr": 8.130239916569249e-06, "optim/total_tokens": 1985659011072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.2663925886154175, "created_at": "2025-06-03T09:18:25.869282+00:00"} {"global_step": 236710, "acc_step": 0, "speed/wps": 5525.836151663184, "speed/FLOPS": 244213674110100.53, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.89 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.89, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0475931279361248, "optim/lr": 8.126692691474702e-06, "optim/total_tokens": 1985667399680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.254601240158081, "created_at": "2025-06-03T09:18:28.841518+00:00"} {"global_step": 236711, "acc_step": 0, "speed/wps": 5516.8826201530455, "speed/FLOPS": 243817973845681.12, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.89 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.89, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046508196741342545, "optim/lr": 8.123145466380378e-06, "optim/total_tokens": 1985675788288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2533454895019531, "created_at": "2025-06-03T09:18:31.815953+00:00"} {"global_step": 236712, "acc_step": 0, "speed/wps": 5535.969608027005, "speed/FLOPS": 244661521013649.84, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04650372266769409, "optim/lr": 8.119598241285831e-06, "optim/total_tokens": 1985684176896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2663993835449219, "created_at": "2025-06-03T09:18:34.780085+00:00"} {"global_step": 236713, "acc_step": 0, "speed/wps": 5531.561733126056, "speed/FLOPS": 244466715504576.9, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04756680876016617, "optim/lr": 8.116051016191283e-06, "optim/total_tokens": 1985692565504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.267288327217102, "created_at": "2025-06-03T09:18:37.749890+00:00"} {"global_step": 236714, "acc_step": 0, "speed/wps": 5522.546075158237, "speed/FLOPS": 244068269568720.03, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046452052891254425, "optim/lr": 8.112503791096737e-06, "optim/total_tokens": 1985700954112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2525304555892944, "created_at": "2025-06-03T09:18:40.720927+00:00"} {"global_step": 236715, "acc_step": 0, "speed/wps": 5522.893384505478, "speed/FLOPS": 244083618864177.7, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04991859942674637, "optim/lr": 8.108956566002412e-06, "optim/total_tokens": 1985709342720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2493358850479126, "created_at": "2025-06-03T09:18:43.695556+00:00"} {"global_step": 236716, "acc_step": 0, "speed/wps": 5527.562598527557, "speed/FLOPS": 244289974224749.72, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048389922827482224, "optim/lr": 8.105409340907866e-06, "optim/total_tokens": 1985717731328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2691453695297241, "created_at": "2025-06-03T09:18:46.667488+00:00"} {"global_step": 236717, "acc_step": 0, "speed/wps": 5529.0716168934205, "speed/FLOPS": 244356665112664.7, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046532679349184036, "optim/lr": 8.10186211581332e-06, "optim/total_tokens": 1985726119936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2566505670547485, "created_at": "2025-06-03T09:18:49.638392+00:00"} {"global_step": 236718, "acc_step": 0, "speed/wps": 5511.24410069982, "speed/FLOPS": 243568780146407.38, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047144193202257156, "optim/lr": 8.098314890718771e-06, "optim/total_tokens": 1985734508544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2543830871582031, "created_at": "2025-06-03T09:18:52.615562+00:00"} {"global_step": 236719, "acc_step": 0, "speed/wps": 5515.399502278112, "speed/FLOPS": 243752427626894.53, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04928765445947647, "optim/lr": 8.094767665624447e-06, "optim/total_tokens": 1985742897152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2573730945587158, "created_at": "2025-06-03T09:18:55.595665+00:00"} {"global_step": 236720, "acc_step": 0, "speed/wps": 5532.364354843527, "speed/FLOPS": 244502187276298.72, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04835648834705353, "optim/lr": 8.0912204405299e-06, "optim/total_tokens": 1985751285760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2714110612869263, "created_at": "2025-06-03T09:18:58.563396+00:00"} {"global_step": 236721, "acc_step": 0, "speed/wps": 5534.59702245444, "speed/FLOPS": 244600859756872.3, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.52, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04642877355217934, "optim/lr": 8.087673215435354e-06, "optim/total_tokens": 1985759674368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2561156749725342, "created_at": "2025-06-03T09:19:01.533385+00:00"} {"global_step": 236722, "acc_step": 0, "speed/wps": 5522.521857615662, "speed/FLOPS": 244067199277294.84, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04690973833203316, "optim/lr": 8.084125990340808e-06, "optim/total_tokens": 1985768062976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2761904001235962, "created_at": "2025-06-03T09:19:04.505705+00:00"} {"global_step": 236723, "acc_step": 0, "speed/wps": 5523.398854685438, "speed/FLOPS": 244105958058901.0, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04761223495006561, "optim/lr": 8.080578765246482e-06, "optim/total_tokens": 1985776451584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.258993148803711, "created_at": "2025-06-03T09:19:07.477824+00:00"} {"global_step": 236724, "acc_step": 0, "speed/wps": 5519.597618779216, "speed/FLOPS": 243937962888335.12, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04843602702021599, "optim/lr": 8.077031540151935e-06, "optim/total_tokens": 1985784840192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2543706893920898, "created_at": "2025-06-03T09:19:10.454308+00:00"} {"global_step": 236725, "acc_step": 0, "speed/wps": 5522.139160921268, "speed/FLOPS": 244050286042221.88, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04695538058876991, "optim/lr": 8.073484315057389e-06, "optim/total_tokens": 1985793228800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2731192111968994, "created_at": "2025-06-03T09:19:13.425710+00:00"} {"global_step": 236726, "acc_step": 0, "speed/wps": 5524.368594097551, "speed/FLOPS": 244148815577340.12, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.052481576800346375, "optim/lr": 8.069937089962842e-06, "optim/total_tokens": 1985801617408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.254702091217041, "created_at": "2025-06-03T09:19:16.396276+00:00"} {"global_step": 236727, "acc_step": 0, "speed/wps": 5513.662830801849, "speed/FLOPS": 243675675636734.12, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.88 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.88, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04854753240942955, "optim/lr": 8.066389864868518e-06, "optim/total_tokens": 1985810006016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2639678716659546, "created_at": "2025-06-03T09:19:19.375451+00:00"} {"global_step": 236728, "acc_step": 0, "speed/wps": 5527.929365360793, "speed/FLOPS": 244306183441495.9, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04948342964053154, "optim/lr": 8.06284263977397e-06, "optim/total_tokens": 1985818394624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2434604167938232, "created_at": "2025-06-03T09:19:22.347365+00:00"} {"global_step": 236729, "acc_step": 0, "speed/wps": 5535.9534986435065, "speed/FLOPS": 244660809061354.5, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048961859196424484, "optim/lr": 8.059295414679424e-06, "optim/total_tokens": 1985826783232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2556767463684082, "created_at": "2025-06-03T09:19:25.311371+00:00"} {"global_step": 236730, "acc_step": 0, "speed/wps": 5534.378860397066, "speed/FLOPS": 244591218110591.03, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04686347767710686, "optim/lr": 8.055748189585099e-06, "optim/total_tokens": 1985835171840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2666058540344238, "created_at": "2025-06-03T09:19:28.277866+00:00"} {"global_step": 236731, "acc_step": 0, "speed/wps": 5541.36374792731, "speed/FLOPS": 244899914387532.44, "speed/curr_iter_time": 2.9558, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9558, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04937085509300232, "optim/lr": 8.052200964490553e-06, "optim/total_tokens": 1985843560448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.266115665435791, "created_at": "2025-06-03T09:19:31.241975+00:00"} {"global_step": 236732, "acc_step": 0, "speed/wps": 5530.140797841878, "speed/FLOPS": 244403917438022.34, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047091685235500336, "optim/lr": 8.048653739396006e-06, "optim/total_tokens": 1985851949056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2606360912322998, "created_at": "2025-06-03T09:19:34.212680+00:00"} {"global_step": 236733, "acc_step": 0, "speed/wps": 5527.963763808992, "speed/FLOPS": 244307703676839.06, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04702170193195343, "optim/lr": 8.04510651430146e-06, "optim/total_tokens": 1985860337664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2561533451080322, "created_at": "2025-06-03T09:19:37.182980+00:00"} {"global_step": 236734, "acc_step": 0, "speed/wps": 5516.452117536354, "speed/FLOPS": 243798947833535.53, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04930013790726662, "optim/lr": 8.041559289207134e-06, "optim/total_tokens": 1985868726272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2679152488708496, "created_at": "2025-06-03T09:19:40.157672+00:00"} {"global_step": 236735, "acc_step": 0, "speed/wps": 5521.5193094085735, "speed/FLOPS": 244022891778048.44, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0481562614440918, "optim/lr": 8.038012064112587e-06, "optim/total_tokens": 1985877114880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2557830810546875, "created_at": "2025-06-03T09:19:43.129061+00:00"} {"global_step": 236736, "acc_step": 0, "speed/wps": 5522.648387810695, "speed/FLOPS": 244072791264275.03, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04680795595049858, "optim/lr": 8.034464839018041e-06, "optim/total_tokens": 1985885503488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2727986574172974, "created_at": "2025-06-03T09:19:46.104006+00:00"} {"global_step": 236737, "acc_step": 0, "speed/wps": 5526.977754835872, "speed/FLOPS": 244264127127078.6, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05133684724569321, "optim/lr": 8.030917613923494e-06, "optim/total_tokens": 1985893892096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2726919651031494, "created_at": "2025-06-03T09:19:49.076614+00:00"} {"global_step": 236738, "acc_step": 0, "speed/wps": 5529.714589160002, "speed/FLOPS": 244385081195817.2, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.049130577594041824, "optim/lr": 8.02737038882917e-06, "optim/total_tokens": 1985902280704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2524830102920532, "created_at": "2025-06-03T09:19:52.043822+00:00"} {"global_step": 236739, "acc_step": 0, "speed/wps": 5533.170552659823, "speed/FLOPS": 244537817093284.53, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04733797907829285, "optim/lr": 8.023823163734622e-06, "optim/total_tokens": 1985910669312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2585039138793945, "created_at": "2025-06-03T09:19:55.011442+00:00"} {"global_step": 236740, "acc_step": 0, "speed/wps": 5516.066787301069, "speed/FLOPS": 243781918209434.84, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05046262592077255, "optim/lr": 8.020275938640076e-06, "optim/total_tokens": 1985919057920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2681119441986084, "created_at": "2025-06-03T09:19:57.985994+00:00"} {"global_step": 236741, "acc_step": 0, "speed/wps": 5525.288658321762, "speed/FLOPS": 244189477706734.66, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04963222146034241, "optim/lr": 8.016728713545529e-06, "optim/total_tokens": 1985927446528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2548587322235107, "created_at": "2025-06-03T09:20:00.959746+00:00"} {"global_step": 236742, "acc_step": 0, "speed/wps": 5510.285431112374, "speed/FLOPS": 243526411857558.06, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04804998263716698, "optim/lr": 8.013181488451205e-06, "optim/total_tokens": 1985935835136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2733633518218994, "created_at": "2025-06-03T09:20:03.940946+00:00"} {"global_step": 236743, "acc_step": 0, "speed/wps": 5506.825692427612, "speed/FLOPS": 243373509116239.5, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.050665922462940216, "optim/lr": 8.009634263356658e-06, "optim/total_tokens": 1985944223744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.26619553565979, "created_at": "2025-06-03T09:20:06.923369+00:00"} {"global_step": 236744, "acc_step": 0, "speed/wps": 5493.87794756271, "speed/FLOPS": 242801285065776.78, "speed/curr_iter_time": 2.9812, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9812, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.87 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.87, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.049070656299591064, "optim/lr": 8.00608703826211e-06, "optim/total_tokens": 1985952612352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2782719135284424, "created_at": "2025-06-03T09:20:09.914966+00:00"} {"global_step": 236745, "acc_step": 0, "speed/wps": 5518.095370711069, "speed/FLOPS": 243871571212925.72, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04653766378760338, "optim/lr": 8.002539813167564e-06, "optim/total_tokens": 1985961000960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2584542036056519, "created_at": "2025-06-03T09:20:12.889757+00:00"} {"global_step": 236746, "acc_step": 0, "speed/wps": 5520.790467086044, "speed/FLOPS": 243990680677945.84, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04651350528001785, "optim/lr": 7.99899258807324e-06, "optim/total_tokens": 1985969389568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2720896005630493, "created_at": "2025-06-03T09:20:15.865220+00:00"} {"global_step": 236747, "acc_step": 0, "speed/wps": 5514.500099291416, "speed/FLOPS": 243712678618444.34, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.052501749247312546, "optim/lr": 7.995445362978693e-06, "optim/total_tokens": 1985977778176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 357, "loss/out": 1.2700634002685547, "created_at": "2025-06-03T09:20:18.840745+00:00"} {"global_step": 236748, "acc_step": 0, "speed/wps": 5525.652542185855, "speed/FLOPS": 244205559511001.1, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04686975106596947, "optim/lr": 7.991898137884147e-06, "optim/total_tokens": 1985986166784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2709696292877197, "created_at": "2025-06-03T09:20:21.810123+00:00"} {"global_step": 236749, "acc_step": 0, "speed/wps": 5526.675160560399, "speed/FLOPS": 244250754008920.6, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04606761038303375, "optim/lr": 7.988350912789598e-06, "optim/total_tokens": 1985994555392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2756563425064087, "created_at": "2025-06-03T09:20:24.781201+00:00"} {"global_step": 236750, "acc_step": 0, "speed/wps": 5521.971318944316, "speed/FLOPS": 244042868285933.75, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04772903025150299, "optim/lr": 7.984803687695274e-06, "optim/total_tokens": 1986002944000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2761248350143433, "created_at": "2025-06-03T09:20:27.753206+00:00"} {"global_step": 236751, "acc_step": 0, "speed/wps": 5515.912563743527, "speed/FLOPS": 243775102317579.25, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04696912690997124, "optim/lr": 7.981256462600728e-06, "optim/total_tokens": 1986011332608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.268126130104065, "created_at": "2025-06-03T09:20:30.731696+00:00"} {"global_step": 236752, "acc_step": 0, "speed/wps": 5521.310108844448, "speed/FLOPS": 244013646183899.66, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04960109293460846, "optim/lr": 7.977709237506181e-06, "optim/total_tokens": 1986019721216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 359, "loss/out": 1.2677922248840332, "created_at": "2025-06-03T09:20:33.706762+00:00"} {"global_step": 236753, "acc_step": 0, "speed/wps": 5517.823692221368, "speed/FLOPS": 243859564414257.5, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04747483879327774, "optim/lr": 7.974162012411635e-06, "optim/total_tokens": 1986028109824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2745790481567383, "created_at": "2025-06-03T09:20:36.682353+00:00"} {"global_step": 236754, "acc_step": 0, "speed/wps": 5507.984274605695, "speed/FLOPS": 243424712518349.56, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.86 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.86, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.049034178256988525, "optim/lr": 7.97061478731731e-06, "optim/total_tokens": 1986036498432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2726454734802246, "created_at": "2025-06-03T09:20:39.666521+00:00"} {"global_step": 236755, "acc_step": 0, "speed/wps": 5526.1786858605965, "speed/FLOPS": 244228812368377.22, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04804702475667, "optim/lr": 7.967067562222762e-06, "optim/total_tokens": 1986044887040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2665541172027588, "created_at": "2025-06-03T09:20:42.635843+00:00"} {"global_step": 236756, "acc_step": 0, "speed/wps": 5514.889430318461, "speed/FLOPS": 243729885057062.9, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04786330834031105, "optim/lr": 7.963520337128216e-06, "optim/total_tokens": 1986053275648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 358, "loss/out": 1.239935278892517, "created_at": "2025-06-03T09:20:45.614856+00:00"} {"global_step": 236757, "acc_step": 0, "speed/wps": 5520.417742373641, "speed/FLOPS": 243974208153435.62, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04747888445854187, "optim/lr": 7.959973112033891e-06, "optim/total_tokens": 1986061664256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.258552074432373, "created_at": "2025-06-03T09:20:48.587130+00:00"} {"global_step": 236758, "acc_step": 0, "speed/wps": 5518.703990104317, "speed/FLOPS": 243898469074910.8, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0473974235355854, "optim/lr": 7.956425886939345e-06, "optim/total_tokens": 1986070052864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2652673721313477, "created_at": "2025-06-03T09:20:51.560333+00:00"} {"global_step": 236759, "acc_step": 0, "speed/wps": 5515.7253627959935, "speed/FLOPS": 243766828993879.56, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04807247593998909, "optim/lr": 7.952878661844799e-06, "optim/total_tokens": 1986078441472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2827975749969482, "created_at": "2025-06-03T09:20:54.534791+00:00"} {"global_step": 236760, "acc_step": 0, "speed/wps": 5506.640340170693, "speed/FLOPS": 243365317495202.53, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04647642746567726, "optim/lr": 7.94933143675025e-06, "optim/total_tokens": 1986086830080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2579292058944702, "created_at": "2025-06-03T09:20:57.514996+00:00"} {"global_step": 236761, "acc_step": 0, "speed/wps": 5510.053261262664, "speed/FLOPS": 243516151138553.88, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04679277539253235, "optim/lr": 7.945784211655926e-06, "optim/total_tokens": 1986095218688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2483031749725342, "created_at": "2025-06-03T09:21:00.492778+00:00"} {"global_step": 236762, "acc_step": 0, "speed/wps": 5508.678697065866, "speed/FLOPS": 243455402436712.78, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.85 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.85, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04962703213095665, "optim/lr": 7.94223698656138e-06, "optim/total_tokens": 1986103607296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2579748630523682, "created_at": "2025-06-03T09:21:03.472467+00:00"} {"global_step": 236763, "acc_step": 0, "speed/wps": 5536.723333121219, "speed/FLOPS": 244694831804899.34, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 194.56, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04745732620358467, "optim/lr": 7.938689761466833e-06, "optim/total_tokens": 1986111995904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.27055823802948, "created_at": "2025-06-03T09:21:06.436086+00:00"} {"global_step": 236764, "acc_step": 0, "speed/wps": 5518.983048383783, "speed/FLOPS": 243910802022513.47, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048458825796842575, "optim/lr": 7.935142536372287e-06, "optim/total_tokens": 1986120384512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2632269859313965, "created_at": "2025-06-03T09:21:09.412735+00:00"} {"global_step": 236765, "acc_step": 0, "speed/wps": 5523.418255840006, "speed/FLOPS": 244106815490628.8, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048678766936063766, "optim/lr": 7.93159531127796e-06, "optim/total_tokens": 1986128773120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2683287858963013, "created_at": "2025-06-03T09:21:12.387798+00:00"} {"global_step": 236766, "acc_step": 0, "speed/wps": 5510.966697581454, "speed/FLOPS": 243556520348453.5, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.050159964710474014, "optim/lr": 7.928048086183414e-06, "optim/total_tokens": 1986137161728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2724175453186035, "created_at": "2025-06-03T09:21:15.368658+00:00"} {"global_step": 236767, "acc_step": 0, "speed/wps": 5520.549159373198, "speed/FLOPS": 243980016112162.84, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05020315945148468, "optim/lr": 7.924500861088868e-06, "optim/total_tokens": 1986145550336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2825819253921509, "created_at": "2025-06-03T09:21:18.341911+00:00"} {"global_step": 236768, "acc_step": 0, "speed/wps": 5515.797540749904, "speed/FLOPS": 243770018890002.16, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04859497770667076, "optim/lr": 7.920953635994321e-06, "optim/total_tokens": 1986153938944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.270980715751648, "created_at": "2025-06-03T09:21:21.316408+00:00"} {"global_step": 236769, "acc_step": 0, "speed/wps": 5516.02244699365, "speed/FLOPS": 243779958594801.22, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04815578833222389, "optim/lr": 7.917406410899997e-06, "optim/total_tokens": 1986162327552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2457284927368164, "created_at": "2025-06-03T09:21:24.290970+00:00"} {"global_step": 236770, "acc_step": 0, "speed/wps": 5508.90598682903, "speed/FLOPS": 243465447480870.16, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05287735536694527, "optim/lr": 7.91385918580545e-06, "optim/total_tokens": 1986170716160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2585872411727905, "created_at": "2025-06-03T09:21:27.272059+00:00"} {"global_step": 236771, "acc_step": 0, "speed/wps": 5522.8927217383625, "speed/FLOPS": 244083589573263.53, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04678947851061821, "optim/lr": 7.910311960710903e-06, "optim/total_tokens": 1986179104768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2562589645385742, "created_at": "2025-06-03T09:21:30.244275+00:00"} {"global_step": 236772, "acc_step": 0, "speed/wps": 5527.403884279334, "speed/FLOPS": 244282959867351.44, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04929843917489052, "optim/lr": 7.906764735616356e-06, "optim/total_tokens": 1986187493376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2688905000686646, "created_at": "2025-06-03T09:21:33.213983+00:00"} {"global_step": 236773, "acc_step": 0, "speed/wps": 5516.743733214852, "speed/FLOPS": 243811835753900.78, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.84 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.84, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04655567556619644, "optim/lr": 7.903217510522032e-06, "optim/total_tokens": 1986195881984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2842364311218262, "created_at": "2025-06-03T09:21:36.192428+00:00"} {"global_step": 236774, "acc_step": 0, "speed/wps": 5527.409558489298, "speed/FLOPS": 244283210638388.6, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04868719354271889, "optim/lr": 7.899670285427485e-06, "optim/total_tokens": 1986204270592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.261839747428894, "created_at": "2025-06-03T09:21:39.160960+00:00"} {"global_step": 236775, "acc_step": 0, "speed/wps": 5515.635452231081, "speed/FLOPS": 243762855407114.4, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0469585619866848, "optim/lr": 7.896123060332939e-06, "optim/total_tokens": 1986212659200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2755897045135498, "created_at": "2025-06-03T09:21:42.140397+00:00"} {"global_step": 236776, "acc_step": 0, "speed/wps": 5514.676722103113, "speed/FLOPS": 243720484442683.88, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04772739112377167, "optim/lr": 7.89257583523839e-06, "optim/total_tokens": 1986221047808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2649757862091064, "created_at": "2025-06-03T09:21:45.122568+00:00"} {"global_step": 236777, "acc_step": 0, "speed/wps": 5519.543604802509, "speed/FLOPS": 243935575747033.3, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048304881900548935, "optim/lr": 7.889028610144066e-06, "optim/total_tokens": 1986229436416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2621073722839355, "created_at": "2025-06-03T09:21:48.098532+00:00"} {"global_step": 236778, "acc_step": 0, "speed/wps": 5510.975502983899, "speed/FLOPS": 243556909502171.44, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04846211522817612, "optim/lr": 7.88548138504952e-06, "optim/total_tokens": 1986237825024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2584131956100464, "created_at": "2025-06-03T09:21:51.076747+00:00"} {"global_step": 236779, "acc_step": 0, "speed/wps": 5525.693682936171, "speed/FLOPS": 244207377721587.62, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0466119684278965, "optim/lr": 7.881934159954974e-06, "optim/total_tokens": 1986246213632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2590508460998535, "created_at": "2025-06-03T09:21:54.046010+00:00"} {"global_step": 236780, "acc_step": 0, "speed/wps": 5526.310278774045, "speed/FLOPS": 244234628101598.06, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047592852264642715, "optim/lr": 7.878386934860427e-06, "optim/total_tokens": 1986254602240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2435933351516724, "created_at": "2025-06-03T09:21:57.019964+00:00"} {"global_step": 236781, "acc_step": 0, "speed/wps": 5520.0554755805015, "speed/FLOPS": 243958197815428.4, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04653085023164749, "optim/lr": 7.874839709766101e-06, "optim/total_tokens": 1986262990848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2617906332015991, "created_at": "2025-06-03T09:21:59.995173+00:00"} {"global_step": 236782, "acc_step": 0, "speed/wps": 5523.197806485817, "speed/FLOPS": 244097072757535.72, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04728009179234505, "optim/lr": 7.871292484671555e-06, "optim/total_tokens": 1986271379456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.264821171760559, "created_at": "2025-06-03T09:22:02.965973+00:00"} {"global_step": 236783, "acc_step": 0, "speed/wps": 5515.590747063526, "speed/FLOPS": 243760879667530.25, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04981982335448265, "optim/lr": 7.867745259577008e-06, "optim/total_tokens": 1986279768064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2708146572113037, "created_at": "2025-06-03T09:22:05.942983+00:00"} {"global_step": 236784, "acc_step": 0, "speed/wps": 5520.396600985042, "speed/FLOPS": 243973273812271.0, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04660620912909508, "optim/lr": 7.864198034482684e-06, "optim/total_tokens": 1986288156672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.253989815711975, "created_at": "2025-06-03T09:22:08.918184+00:00"} {"global_step": 236785, "acc_step": 0, "speed/wps": 5514.427095769365, "speed/FLOPS": 243709452236435.62, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04810844361782074, "optim/lr": 7.860650809388137e-06, "optim/total_tokens": 1986296545280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2664482593536377, "created_at": "2025-06-03T09:22:11.897946+00:00"} {"global_step": 236786, "acc_step": 0, "speed/wps": 5529.385058533499, "speed/FLOPS": 244370517628816.44, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.048503328114748, "optim/lr": 7.85710358429359e-06, "optim/total_tokens": 1986304933888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2675938606262207, "created_at": "2025-06-03T09:22:14.866003+00:00"} {"global_step": 236787, "acc_step": 0, "speed/wps": 5510.253852005179, "speed/FLOPS": 243525016222656.6, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.83 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.83, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04939702898263931, "optim/lr": 7.853556359199043e-06, "optim/total_tokens": 1986313322496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2539907693862915, "created_at": "2025-06-03T09:22:17.843733+00:00"} {"global_step": 236788, "acc_step": 0, "speed/wps": 5527.939395808882, "speed/FLOPS": 244306626735960.97, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04832928255200386, "optim/lr": 7.850009134104718e-06, "optim/total_tokens": 1986321711104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2532010078430176, "created_at": "2025-06-03T09:22:20.814407+00:00"} {"global_step": 236789, "acc_step": 0, "speed/wps": 5521.791217194188, "speed/FLOPS": 244034908710422.38, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04783356562256813, "optim/lr": 7.846461909010172e-06, "optim/total_tokens": 1986330099712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2536910772323608, "created_at": "2025-06-03T09:22:23.791464+00:00"} {"global_step": 236790, "acc_step": 0, "speed/wps": 5521.585531851919, "speed/FLOPS": 244025818471087.1, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04672779515385628, "optim/lr": 7.842914683915626e-06, "optim/total_tokens": 1986338488320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.260890007019043, "created_at": "2025-06-03T09:22:26.767011+00:00"} {"global_step": 236791, "acc_step": 0, "speed/wps": 5517.591847594853, "speed/FLOPS": 243849318068453.88, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.26, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047339584678411484, "optim/lr": 7.83936745882108e-06, "optim/total_tokens": 1986346876928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2584525346755981, "created_at": "2025-06-03T09:22:29.742854+00:00"} {"global_step": 236792, "acc_step": 0, "speed/wps": 5519.43422627408, "speed/FLOPS": 243930741775926.78, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047237690538167953, "optim/lr": 7.835820233726753e-06, "optim/total_tokens": 1986355265536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2322280406951904, "created_at": "2025-06-03T09:22:32.718699+00:00"} {"global_step": 236793, "acc_step": 0, "speed/wps": 5505.453644577235, "speed/FLOPS": 243312871624030.34, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04782895743846893, "optim/lr": 7.832273008632207e-06, "optim/total_tokens": 1986363654144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2606921195983887, "created_at": "2025-06-03T09:22:35.703001+00:00"} {"global_step": 236794, "acc_step": 0, "speed/wps": 5506.585826263069, "speed/FLOPS": 243362908259513.0, "speed/curr_iter_time": 2.9745, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9745, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04765019938349724, "optim/lr": 7.82872578353766e-06, "optim/total_tokens": 1986372042752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.254852533340454, "created_at": "2025-06-03T09:22:38.685089+00:00"} {"global_step": 236795, "acc_step": 0, "speed/wps": 5508.529114389553, "speed/FLOPS": 243448791648053.28, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0478803850710392, "optim/lr": 7.825178558443114e-06, "optim/total_tokens": 1986380431360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.253278374671936, "created_at": "2025-06-03T09:22:41.667930+00:00"} {"global_step": 236796, "acc_step": 0, "speed/wps": 5520.079041015232, "speed/FLOPS": 243959239287024.66, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0471280999481678, "optim/lr": 7.82163133334879e-06, "optim/total_tokens": 1986388819968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.251409649848938, "created_at": "2025-06-03T09:22:44.640305+00:00"} {"global_step": 236797, "acc_step": 0, "speed/wps": 5521.07169178736, "speed/FLOPS": 244003109370305.47, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.0472845695912838, "optim/lr": 7.818084108254241e-06, "optim/total_tokens": 1986397208576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2675864696502686, "created_at": "2025-06-03T09:22:47.612267+00:00"} {"global_step": 236798, "acc_step": 0, "speed/wps": 5511.339808121391, "speed/FLOPS": 243573009924565.84, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046695586293935776, "optim/lr": 7.814536883159695e-06, "optim/total_tokens": 1986405597184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.274966835975647, "created_at": "2025-06-03T09:22:50.594404+00:00"} {"global_step": 236799, "acc_step": 0, "speed/wps": 5506.727081680948, "speed/FLOPS": 243369151025972.47, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046559832990169525, "optim/lr": 7.810989658065148e-06, "optim/total_tokens": 1986413985792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2759641408920288, "created_at": "2025-06-03T09:22:53.579746+00:00"} {"global_step": 236800, "acc_step": 0, "speed/wps": 5502.784963476609, "speed/FLOPS": 243194929578930.8, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.82 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.82, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046786416321992874, "optim/lr": 7.807442432970824e-06, "optim/total_tokens": 1986422374400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2546772956848145, "created_at": "2025-06-03T09:22:56.562167+00:00"} {"global_step": 236801, "acc_step": 0, "speed/wps": 5514.980500854514, "speed/FLOPS": 243733909908615.2, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04643046855926514, "optim/lr": 7.803895207876278e-06, "optim/total_tokens": 1986430763008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2694239616394043, "created_at": "2025-06-03T09:22:59.537322+00:00"} {"global_step": 236802, "acc_step": 0, "speed/wps": 5514.124901957205, "speed/FLOPS": 243696096816706.28, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04905617982149124, "optim/lr": 7.80034798278173e-06, "optim/total_tokens": 1986439151616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2574520111083984, "created_at": "2025-06-03T09:23:02.517053+00:00"} {"global_step": 236803, "acc_step": 0, "speed/wps": 5514.4743593808425, "speed/FLOPS": 243711541046145.8, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04782949015498161, "optim/lr": 7.796800757687183e-06, "optim/total_tokens": 1986447540224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.270674228668213, "created_at": "2025-06-03T09:23:05.496344+00:00"} {"global_step": 236804, "acc_step": 0, "speed/wps": 5525.352945562611, "speed/FLOPS": 244192318873728.25, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04829510673880577, "optim/lr": 7.793253532592859e-06, "optim/total_tokens": 1986455928832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2650619745254517, "created_at": "2025-06-03T09:23:08.468096+00:00"} {"global_step": 236805, "acc_step": 0, "speed/wps": 5536.272292764203, "speed/FLOPS": 244674898129753.03, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 194.61, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04823249578475952, "optim/lr": 7.789706307498312e-06, "optim/total_tokens": 1986464317440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2708642482757568, "created_at": "2025-06-03T09:23:11.432987+00:00"} {"global_step": 236806, "acc_step": 0, "speed/wps": 5540.97898871775, "speed/FLOPS": 244882909999846.06, "speed/curr_iter_time": 2.9548, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9548, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 194.37, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04644361510872841, "optim/lr": 7.786159082403766e-06, "optim/total_tokens": 1986472706048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2494057416915894, "created_at": "2025-06-03T09:23:14.393951+00:00"} {"global_step": 236807, "acc_step": 0, "speed/wps": 5527.49008976207, "speed/FLOPS": 244286769708448.7, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04733472317457199, "optim/lr": 7.782611857309218e-06, "optim/total_tokens": 1986481094656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2703344821929932, "created_at": "2025-06-03T09:23:17.363644+00:00"} {"global_step": 236808, "acc_step": 0, "speed/wps": 5523.135231866178, "speed/FLOPS": 244094307279633.66, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.05011087283492088, "optim/lr": 7.779064632214893e-06, "optim/total_tokens": 1986489483264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2602083683013916, "created_at": "2025-06-03T09:23:20.339089+00:00"} {"global_step": 236809, "acc_step": 0, "speed/wps": 5512.568157829321, "speed/FLOPS": 243627296694392.56, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04903816804289818, "optim/lr": 7.775517407120347e-06, "optim/total_tokens": 1986497871872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2679086923599243, "created_at": "2025-06-03T09:23:23.316905+00:00"} {"global_step": 236810, "acc_step": 0, "speed/wps": 5513.9772558505465, "speed/FLOPS": 243689571614513.25, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04940110072493553, "optim/lr": 7.7719701820258e-06, "optim/total_tokens": 1986506260480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2424837350845337, "created_at": "2025-06-03T09:23:26.297108+00:00"} {"global_step": 236811, "acc_step": 0, "speed/wps": 5512.262477144537, "speed/FLOPS": 243613787172740.72, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04819789156317711, "optim/lr": 7.768422956931476e-06, "optim/total_tokens": 1986514649088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.274258017539978, "created_at": "2025-06-03T09:23:29.277522+00:00"} {"global_step": 236812, "acc_step": 0, "speed/wps": 5508.940324892698, "speed/FLOPS": 243466965047526.16, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04937618598341942, "optim/lr": 7.76487573183693e-06, "optim/total_tokens": 1986523037696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2629923820495605, "created_at": "2025-06-03T09:23:32.256038+00:00"} {"global_step": 236813, "acc_step": 0, "speed/wps": 5506.171806069268, "speed/FLOPS": 243344610686094.47, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.81 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.81, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04734690114855766, "optim/lr": 7.761328506742382e-06, "optim/total_tokens": 1986531426304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2537827491760254, "created_at": "2025-06-03T09:23:35.240083+00:00"} {"global_step": 236814, "acc_step": 0, "speed/wps": 5514.484215305653, "speed/FLOPS": 243711976627575.28, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.047108739614486694, "optim/lr": 7.757781281647835e-06, "optim/total_tokens": 1986539814912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2735902070999146, "created_at": "2025-06-03T09:23:38.216833+00:00"} {"global_step": 236815, "acc_step": 0, "speed/wps": 5521.141341717044, "speed/FLOPS": 244006187540696.88, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.04808971285820007, "optim/lr": 7.75423405655351e-06, "optim/total_tokens": 1986548203520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2629168033599854, "created_at": "2025-06-03T09:23:41.189120+00:00"} {"global_step": 236816, "acc_step": 0, "speed/wps": 5530.504559151892, "speed/FLOPS": 244419993826025.78, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 194.72, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04671930894255638, "optim/lr": 7.750686831458964e-06, "optim/total_tokens": 1986556592128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2600133419036865, "created_at": "2025-06-03T09:23:44.161174+00:00"} {"global_step": 236817, "acc_step": 0, "speed/wps": 5521.3951101631865, "speed/FLOPS": 244017402807111.7, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04680138826370239, "optim/lr": 7.747139606364418e-06, "optim/total_tokens": 1986564980736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2933305501937866, "created_at": "2025-06-03T09:23:47.136372+00:00"} {"global_step": 236818, "acc_step": 0, "speed/wps": 5534.787995405586, "speed/FLOPS": 244609299783824.78, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 194.68, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04665270820260048, "optim/lr": 7.74359238126987e-06, "optim/total_tokens": 1986573369344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2788082361221313, "created_at": "2025-06-03T09:23:50.103768+00:00"} {"global_step": 236819, "acc_step": 0, "speed/wps": 5518.311903365366, "speed/FLOPS": 243881140847931.0, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046701546758413315, "optim/lr": 7.740045156175545e-06, "optim/total_tokens": 1986581757952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2625031471252441, "created_at": "2025-06-03T09:23:53.078627+00:00"} {"global_step": 236820, "acc_step": 0, "speed/wps": 5509.771213974633, "speed/FLOPS": 243503686092071.8, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.8 hours", "speed/est_time_elapsed_hrs": 195.56, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.8, "speed/est_time_remaining_days": 0.08, "optim/grad_norm": 0.046985968947410583, "optim/lr": 7.736497931080999e-06, "optim/total_tokens": 1986590146560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2600911855697632, "created_at": "2025-06-03T09:23:56.056725+00:00"} {"global_step": 236821, "acc_step": 0, "speed/wps": 5534.554169763489, "speed/FLOPS": 244598965887272.22, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 194.69, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04754646494984627, "optim/lr": 7.732950705986453e-06, "optim/total_tokens": 1986598535168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2624542713165283, "created_at": "2025-06-03T09:23:59.023741+00:00"} {"global_step": 236822, "acc_step": 0, "speed/wps": 5524.65853123849, "speed/FLOPS": 244161629314936.8, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04699311777949333, "optim/lr": 7.729403480891906e-06, "optim/total_tokens": 1986606923776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2667657136917114, "created_at": "2025-06-03T09:24:01.994564+00:00"} {"global_step": 236823, "acc_step": 0, "speed/wps": 5522.7786510076085, "speed/FLOPS": 244078548230831.16, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04995295777916908, "optim/lr": 7.725856255797582e-06, "optim/total_tokens": 1986615312384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2697415351867676, "created_at": "2025-06-03T09:24:04.970690+00:00"} {"global_step": 236824, "acc_step": 0, "speed/wps": 5531.562816278389, "speed/FLOPS": 244466763374365.9, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04737360402941704, "optim/lr": 7.722309030703034e-06, "optim/total_tokens": 1986623700992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.279757022857666, "created_at": "2025-06-03T09:24:07.941712+00:00"} {"global_step": 236825, "acc_step": 0, "speed/wps": 5522.6599373381905, "speed/FLOPS": 244073301694274.5, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046567656099796295, "optim/lr": 7.718761805608487e-06, "optim/total_tokens": 1986632089600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2611336708068848, "created_at": "2025-06-03T09:24:10.914064+00:00"} {"global_step": 236826, "acc_step": 0, "speed/wps": 5520.007327304242, "speed/FLOPS": 243956069908062.94, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.049229469150304794, "optim/lr": 7.71521458051394e-06, "optim/total_tokens": 1986640478208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.26313054561615, "created_at": "2025-06-03T09:24:13.890277+00:00"} {"global_step": 236827, "acc_step": 0, "speed/wps": 5514.475013214725, "speed/FLOPS": 243711569942256.78, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04686926305294037, "optim/lr": 7.711667355419616e-06, "optim/total_tokens": 1986648866816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2728468179702759, "created_at": "2025-06-03T09:24:16.865929+00:00"} {"global_step": 236828, "acc_step": 0, "speed/wps": 5508.735282288584, "speed/FLOPS": 243457903213927.5, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04759646952152252, "optim/lr": 7.70812013032507e-06, "optim/total_tokens": 1986657255424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.257859468460083, "created_at": "2025-06-03T09:24:19.844322+00:00"} {"global_step": 236829, "acc_step": 0, "speed/wps": 5511.984326029328, "speed/FLOPS": 243601494317154.97, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04740116000175476, "optim/lr": 7.704572905230522e-06, "optim/total_tokens": 1986665644032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.277159333229065, "created_at": "2025-06-03T09:24:22.823833+00:00"} {"global_step": 236830, "acc_step": 0, "speed/wps": 5527.058808360803, "speed/FLOPS": 244267709278011.0, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04830804094672203, "optim/lr": 7.701025680135975e-06, "optim/total_tokens": 1986674032640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2715588808059692, "created_at": "2025-06-03T09:24:25.795560+00:00"} {"global_step": 236831, "acc_step": 0, "speed/wps": 5524.73685046752, "speed/FLOPS": 244165090623985.78, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04709189385175705, "optim/lr": 7.697478455041651e-06, "optim/total_tokens": 1986682421248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2606756687164307, "created_at": "2025-06-03T09:24:28.765543+00:00"} {"global_step": 236832, "acc_step": 0, "speed/wps": 5522.27716386916, "speed/FLOPS": 244056385066155.6, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04974560812115669, "optim/lr": 7.693931229947105e-06, "optim/total_tokens": 1986690809856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2769107818603516, "created_at": "2025-06-03T09:24:31.739717+00:00"} {"global_step": 236833, "acc_step": 0, "speed/wps": 5521.583119898929, "speed/FLOPS": 244025711875110.44, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04946701601147652, "optim/lr": 7.690384004852558e-06, "optim/total_tokens": 1986699198464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2629286050796509, "created_at": "2025-06-03T09:24:34.712279+00:00"} {"global_step": 236834, "acc_step": 0, "speed/wps": 5522.160554001107, "speed/FLOPS": 244051231506851.06, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04745404049754143, "optim/lr": 7.68683677975801e-06, "optim/total_tokens": 1986707587072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2622507810592651, "created_at": "2025-06-03T09:24:37.687784+00:00"} {"global_step": 236835, "acc_step": 0, "speed/wps": 5516.132725082564, "speed/FLOPS": 243784832321876.78, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04976898804306984, "optim/lr": 7.683289554663686e-06, "optim/total_tokens": 1986715975680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2650632858276367, "created_at": "2025-06-03T09:24:40.662971+00:00"} {"global_step": 236836, "acc_step": 0, "speed/wps": 5528.146915004125, "speed/FLOPS": 244315798022211.16, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0477936677634716, "optim/lr": 7.67974232956914e-06, "optim/total_tokens": 1986724364288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2593531608581543, "created_at": "2025-06-03T09:24:43.634497+00:00"} {"global_step": 236837, "acc_step": 0, "speed/wps": 5500.787258718753, "speed/FLOPS": 243106641253813.47, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.79 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.79, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046536583453416824, "optim/lr": 7.676195104474593e-06, "optim/total_tokens": 1986732752896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2649701833724976, "created_at": "2025-06-03T09:24:46.620698+00:00"} {"global_step": 236838, "acc_step": 0, "speed/wps": 5521.932695691095, "speed/FLOPS": 244041161335833.1, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.050822366029024124, "optim/lr": 7.672647879380268e-06, "optim/total_tokens": 1986741141504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2699710130691528, "created_at": "2025-06-03T09:24:49.596402+00:00"} {"global_step": 236839, "acc_step": 0, "speed/wps": 5523.9838279560145, "speed/FLOPS": 244131810883295.88, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04703858122229576, "optim/lr": 7.66910065428572e-06, "optim/total_tokens": 1986749530112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2634176015853882, "created_at": "2025-06-03T09:24:52.567043+00:00"} {"global_step": 236840, "acc_step": 0, "speed/wps": 5527.078935473671, "speed/FLOPS": 244268598793379.88, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046752411872148514, "optim/lr": 7.665553429191174e-06, "optim/total_tokens": 1986757918720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2517753839492798, "created_at": "2025-06-03T09:24:55.540435+00:00"} {"global_step": 236841, "acc_step": 0, "speed/wps": 5520.01479459899, "speed/FLOPS": 243956399924269.75, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05016050860285759, "optim/lr": 7.662006204096628e-06, "optim/total_tokens": 1986766307328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2663594484329224, "created_at": "2025-06-03T09:24:58.513510+00:00"} {"global_step": 236842, "acc_step": 0, "speed/wps": 5523.623184143025, "speed/FLOPS": 244115872272704.12, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.049267739057540894, "optim/lr": 7.658458979002303e-06, "optim/total_tokens": 1986774695936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2598823308944702, "created_at": "2025-06-03T09:25:01.485748+00:00"} {"global_step": 236843, "acc_step": 0, "speed/wps": 5526.356119207841, "speed/FLOPS": 244236654014139.25, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04642337188124657, "optim/lr": 7.654911753907757e-06, "optim/total_tokens": 1986783084544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2610214948654175, "created_at": "2025-06-03T09:25:04.455784+00:00"} {"global_step": 236844, "acc_step": 0, "speed/wps": 5516.637558309632, "speed/FLOPS": 243807143366542.5, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05443308874964714, "optim/lr": 7.65136452881321e-06, "optim/total_tokens": 1986791473152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2577534914016724, "created_at": "2025-06-03T09:25:07.432661+00:00"} {"global_step": 236845, "acc_step": 0, "speed/wps": 5521.44967203753, "speed/FLOPS": 244019814162684.7, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047011781483888626, "optim/lr": 7.647817303718662e-06, "optim/total_tokens": 1986799861760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2680679559707642, "created_at": "2025-06-03T09:25:10.409133+00:00"} {"global_step": 236846, "acc_step": 0, "speed/wps": 5523.144758965888, "speed/FLOPS": 244094728328676.72, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04765023663640022, "optim/lr": 7.644270078624338e-06, "optim/total_tokens": 1986808250368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2661112546920776, "created_at": "2025-06-03T09:25:13.382270+00:00"} {"global_step": 236847, "acc_step": 0, "speed/wps": 5531.460880935986, "speed/FLOPS": 244462258353984.1, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.052211079746484756, "optim/lr": 7.640722853529791e-06, "optim/total_tokens": 1986816638976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2551922798156738, "created_at": "2025-06-03T09:25:16.348151+00:00"} {"global_step": 236848, "acc_step": 0, "speed/wps": 5520.357968576438, "speed/FLOPS": 243971566457549.28, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04999212175607681, "optim/lr": 7.637175628435245e-06, "optim/total_tokens": 1986825027584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2698991298675537, "created_at": "2025-06-03T09:25:19.320611+00:00"} {"global_step": 236849, "acc_step": 0, "speed/wps": 5503.469273770598, "speed/FLOPS": 243225172591307.53, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.78 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.78, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046324584633111954, "optim/lr": 7.633628403340699e-06, "optim/total_tokens": 1986833416192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2534334659576416, "created_at": "2025-06-03T09:25:22.301806+00:00"} {"global_step": 236850, "acc_step": 0, "speed/wps": 5525.177900615462, "speed/FLOPS": 244184582783025.53, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04894920065999031, "optim/lr": 7.630081178246372e-06, "optim/total_tokens": 1986841804800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2728025913238525, "created_at": "2025-06-03T09:25:25.275966+00:00"} {"global_step": 236851, "acc_step": 0, "speed/wps": 5529.36170076799, "speed/FLOPS": 244369485335136.8, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.050765808671712875, "optim/lr": 7.626533953151826e-06, "optim/total_tokens": 1986850193408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.25597083568573, "created_at": "2025-06-03T09:25:28.243650+00:00"} {"global_step": 236852, "acc_step": 0, "speed/wps": 5516.41962097295, "speed/FLOPS": 243797511651765.53, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046063151210546494, "optim/lr": 7.62298672805728e-06, "optim/total_tokens": 1986858582016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2735146284103394, "created_at": "2025-06-03T09:25:31.219173+00:00"} {"global_step": 236853, "acc_step": 0, "speed/wps": 5512.659465677742, "speed/FLOPS": 243631332033936.88, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046830836683511734, "optim/lr": 7.619439502962733e-06, "optim/total_tokens": 1986866970624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2737659215927124, "created_at": "2025-06-03T09:25:34.197703+00:00"} {"global_step": 236854, "acc_step": 0, "speed/wps": 5524.713271272364, "speed/FLOPS": 244164048544249.16, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046847593039274216, "optim/lr": 7.615892277868408e-06, "optim/total_tokens": 1986875359232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2582539319992065, "created_at": "2025-06-03T09:25:37.170717+00:00"} {"global_step": 236855, "acc_step": 0, "speed/wps": 5528.14321442558, "speed/FLOPS": 244315634475580.75, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04870113357901573, "optim/lr": 7.6123450527738615e-06, "optim/total_tokens": 1986883747840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.263258934020996, "created_at": "2025-06-03T09:25:40.138653+00:00"} {"global_step": 236856, "acc_step": 0, "speed/wps": 5524.128734150766, "speed/FLOPS": 244138214995406.75, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048368968069553375, "optim/lr": 7.608797827679314e-06, "optim/total_tokens": 1986892136448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2767375707626343, "created_at": "2025-06-03T09:25:43.108808+00:00"} {"global_step": 236857, "acc_step": 0, "speed/wps": 5527.574901113137, "speed/FLOPS": 244290517936061.97, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04725470021367073, "optim/lr": 7.605250602584768e-06, "optim/total_tokens": 1986900525056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2518093585968018, "created_at": "2025-06-03T09:25:46.077468+00:00"} {"global_step": 236858, "acc_step": 0, "speed/wps": 5520.314750168287, "speed/FLOPS": 243969656425120.88, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05214865878224373, "optim/lr": 7.601703377490443e-06, "optim/total_tokens": 1986908913664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.286128282546997, "created_at": "2025-06-03T09:25:49.049761+00:00"} {"global_step": 236859, "acc_step": 0, "speed/wps": 5517.439474672204, "speed/FLOPS": 243842583965188.12, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.051198724657297134, "optim/lr": 7.598156152395896e-06, "optim/total_tokens": 1986917302272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2672436237335205, "created_at": "2025-06-03T09:25:52.023366+00:00"} {"global_step": 236860, "acc_step": 0, "speed/wps": 5504.888186937606, "speed/FLOPS": 243287881290633.34, "speed/curr_iter_time": 2.9754, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9754, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04666585847735405, "optim/lr": 7.59460892730135e-06, "optim/total_tokens": 1986925690880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2569921016693115, "created_at": "2025-06-03T09:25:55.004111+00:00"} {"global_step": 236861, "acc_step": 0, "speed/wps": 5512.908351528134, "speed/FLOPS": 243642331514610.9, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.77 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.77, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04798484593629837, "optim/lr": 7.591061702206803e-06, "optim/total_tokens": 1986934079488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.252875566482544, "created_at": "2025-06-03T09:25:57.980696+00:00"} {"global_step": 236862, "acc_step": 0, "speed/wps": 5513.749892628754, "speed/FLOPS": 243679523323860.53, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.45, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04718652740120888, "optim/lr": 7.587514477112478e-06, "optim/total_tokens": 1986942468096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2565525770187378, "created_at": "2025-06-03T09:26:00.956436+00:00"} {"global_step": 236863, "acc_step": 0, "speed/wps": 5515.979799301249, "speed/FLOPS": 243778073785087.75, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047308389097452164, "optim/lr": 7.583967252017932e-06, "optim/total_tokens": 1986950856704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.271248698234558, "created_at": "2025-06-03T09:26:03.932274+00:00"} {"global_step": 236864, "acc_step": 0, "speed/wps": 5520.299641185949, "speed/FLOPS": 243968988685436.34, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04721726104617119, "optim/lr": 7.580420026923384e-06, "optim/total_tokens": 1986959245312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2613469362258911, "created_at": "2025-06-03T09:26:06.907463+00:00"} {"global_step": 236865, "acc_step": 0, "speed/wps": 5525.405363027316, "speed/FLOPS": 244194635457371.28, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047443728893995285, "optim/lr": 7.57687280182906e-06, "optim/total_tokens": 1986967633920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2588095664978027, "created_at": "2025-06-03T09:26:09.878625+00:00"} {"global_step": 236866, "acc_step": 0, "speed/wps": 5513.258989070246, "speed/FLOPS": 243657827899246.62, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046200238168239594, "optim/lr": 7.5733255767345135e-06, "optim/total_tokens": 1986976022528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2526075839996338, "created_at": "2025-06-03T09:26:12.857418+00:00"} {"global_step": 236867, "acc_step": 0, "speed/wps": 5516.81477739703, "speed/FLOPS": 243814975543115.97, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04653783142566681, "optim/lr": 7.569778351639966e-06, "optim/total_tokens": 1986984411136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.261601448059082, "created_at": "2025-06-03T09:26:15.831573+00:00"} {"global_step": 236868, "acc_step": 0, "speed/wps": 5520.432020059104, "speed/FLOPS": 243974839154053.25, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04652881249785423, "optim/lr": 7.56623112654542e-06, "optim/total_tokens": 1986992799744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2569466829299927, "created_at": "2025-06-03T09:26:18.803802+00:00"} {"global_step": 236869, "acc_step": 0, "speed/wps": 5517.8304120127, "speed/FLOPS": 243859861394639.38, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0498165600001812, "optim/lr": 7.562683901451095e-06, "optim/total_tokens": 1987001188352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2650117874145508, "created_at": "2025-06-03T09:26:21.781814+00:00"} {"global_step": 236870, "acc_step": 0, "speed/wps": 5517.030607889121, "speed/FLOPS": 243824514146145.75, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.76 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.76, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047272082418203354, "optim/lr": 7.559136676356548e-06, "optim/total_tokens": 1987009576960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2477059364318848, "created_at": "2025-06-03T09:26:24.756438+00:00"} {"global_step": 236871, "acc_step": 0, "speed/wps": 5520.100535486074, "speed/FLOPS": 243960189232617.2, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05077674984931946, "optim/lr": 7.555589451262002e-06, "optim/total_tokens": 1987017965568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2595264911651611, "created_at": "2025-06-03T09:26:27.728903+00:00"} {"global_step": 236872, "acc_step": 0, "speed/wps": 5521.888853359325, "speed/FLOPS": 244039223729174.25, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04662314057350159, "optim/lr": 7.5520422261674545e-06, "optim/total_tokens": 1987026354176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2756071090698242, "created_at": "2025-06-03T09:26:30.702653+00:00"} {"global_step": 236873, "acc_step": 0, "speed/wps": 5521.699178949318, "speed/FLOPS": 244030841091093.56, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04756033420562744, "optim/lr": 7.54849500107313e-06, "optim/total_tokens": 1987034742784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2681727409362793, "created_at": "2025-06-03T09:26:33.674250+00:00"} {"global_step": 236874, "acc_step": 0, "speed/wps": 5530.83268174416, "speed/FLOPS": 244434495165120.34, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.050801049917936325, "optim/lr": 7.544947775978584e-06, "optim/total_tokens": 1987043131392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2634116411209106, "created_at": "2025-06-03T09:26:36.645249+00:00"} {"global_step": 236875, "acc_step": 0, "speed/wps": 5520.450843867638, "speed/FLOPS": 243975671070041.47, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0465133935213089, "optim/lr": 7.5414005508840364e-06, "optim/total_tokens": 1987051520000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2659918069839478, "created_at": "2025-06-03T09:26:39.617456+00:00"} {"global_step": 236876, "acc_step": 0, "speed/wps": 5514.070785046061, "speed/FLOPS": 243693705126229.2, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04867169260978699, "optim/lr": 7.53785332578949e-06, "optim/total_tokens": 1987059908608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2721909284591675, "created_at": "2025-06-03T09:26:42.596389+00:00"} {"global_step": 236877, "acc_step": 0, "speed/wps": 5505.421895126343, "speed/FLOPS": 243311468460809.34, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04763702303171158, "optim/lr": 7.5343061006951656e-06, "optim/total_tokens": 1987068297216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2547146081924438, "created_at": "2025-06-03T09:26:45.576789+00:00"} {"global_step": 236878, "acc_step": 0, "speed/wps": 5516.914256253556, "speed/FLOPS": 243819371999395.47, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04716473072767258, "optim/lr": 7.530758875600618e-06, "optim/total_tokens": 1987076685824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2733441591262817, "created_at": "2025-06-03T09:26:48.551570+00:00"} {"global_step": 236879, "acc_step": 0, "speed/wps": 5517.028675712661, "speed/FLOPS": 243824428753836.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04639221355319023, "optim/lr": 7.527211650506072e-06, "optim/total_tokens": 1987085074432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.270566701889038, "created_at": "2025-06-03T09:26:51.525424+00:00"} {"global_step": 236880, "acc_step": 0, "speed/wps": 5528.1067039954305, "speed/FLOPS": 244314020901445.47, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04966643080115318, "optim/lr": 7.523664425411525e-06, "optim/total_tokens": 1987093463040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2755264043807983, "created_at": "2025-06-03T09:26:54.494178+00:00"} {"global_step": 236881, "acc_step": 0, "speed/wps": 5517.721703192684, "speed/FLOPS": 243855057021216.8, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04688858985900879, "optim/lr": 7.5201172003172e-06, "optim/total_tokens": 1987101851648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.270713210105896, "created_at": "2025-06-03T09:26:57.467813+00:00"} {"global_step": 236882, "acc_step": 0, "speed/wps": 5506.953423476803, "speed/FLOPS": 243379154174826.97, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05015721172094345, "optim/lr": 7.516569975222654e-06, "optim/total_tokens": 1987110240256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2691022157669067, "created_at": "2025-06-03T09:27:00.449314+00:00"} {"global_step": 236883, "acc_step": 0, "speed/wps": 5517.14845374709, "speed/FLOPS": 243829722329878.2, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.75 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.75, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04851481691002846, "optim/lr": 7.513022750128107e-06, "optim/total_tokens": 1987118628864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2695519924163818, "created_at": "2025-06-03T09:27:03.423910+00:00"} {"global_step": 236884, "acc_step": 0, "speed/wps": 5526.278972723305, "speed/FLOPS": 244233244534394.22, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04894331097602844, "optim/lr": 7.50947552503356e-06, "optim/total_tokens": 1987127017472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2632966041564941, "created_at": "2025-06-03T09:27:06.397819+00:00"} {"global_step": 236885, "acc_step": 0, "speed/wps": 5536.577445254302, "speed/FLOPS": 244688384307903.4, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05016327276825905, "optim/lr": 7.505928299939236e-06, "optim/total_tokens": 1987135406080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2680803537368774, "created_at": "2025-06-03T09:27:09.362473+00:00"} {"global_step": 236886, "acc_step": 0, "speed/wps": 5519.14821191384, "speed/FLOPS": 243918101405158.38, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04955320060253143, "optim/lr": 7.5023810748446885e-06, "optim/total_tokens": 1987143794688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2570048570632935, "created_at": "2025-06-03T09:27:12.336600+00:00"} {"global_step": 236887, "acc_step": 0, "speed/wps": 5516.78974032263, "speed/FLOPS": 243813869032578.8, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04675658792257309, "optim/lr": 7.498833849750142e-06, "optim/total_tokens": 1987152183296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2547253370285034, "created_at": "2025-06-03T09:27:15.311405+00:00"} {"global_step": 236888, "acc_step": 0, "speed/wps": 5520.0076602901645, "speed/FLOPS": 243956084624336.34, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04949307069182396, "optim/lr": 7.495286624655595e-06, "optim/total_tokens": 1987160571904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2559919357299805, "created_at": "2025-06-03T09:27:18.284916+00:00"} {"global_step": 236889, "acc_step": 0, "speed/wps": 5524.789680896537, "speed/FLOPS": 244167425458537.7, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04714428260922432, "optim/lr": 7.49173939956127e-06, "optim/total_tokens": 1987168960512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2659151554107666, "created_at": "2025-06-03T09:27:21.255665+00:00"} {"global_step": 236890, "acc_step": 0, "speed/wps": 5524.8341509885995, "speed/FLOPS": 244169390808988.28, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048537127673625946, "optim/lr": 7.488192174466724e-06, "optim/total_tokens": 1987177349120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2817398309707642, "created_at": "2025-06-03T09:27:24.225825+00:00"} {"global_step": 236891, "acc_step": 0, "speed/wps": 5528.190801177356, "speed/FLOPS": 244317737566438.16, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04850973188877106, "optim/lr": 7.484644949372177e-06, "optim/total_tokens": 1987185737728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2719749212265015, "created_at": "2025-06-03T09:27:27.195391+00:00"} {"global_step": 236892, "acc_step": 0, "speed/wps": 5532.068537775435, "speed/FLOPS": 244489113676018.1, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 194.83, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04628808796405792, "optim/lr": 7.48109772427763e-06, "optim/total_tokens": 1987194126336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2628506422042847, "created_at": "2025-06-03T09:27:30.164441+00:00"} {"global_step": 236893, "acc_step": 0, "speed/wps": 5526.415038619119, "speed/FLOPS": 244239257950540.8, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04750336334109306, "optim/lr": 7.477550499183305e-06, "optim/total_tokens": 1987202514944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2673414945602417, "created_at": "2025-06-03T09:27:33.136391+00:00"} {"global_step": 236894, "acc_step": 0, "speed/wps": 5518.255509397173, "speed/FLOPS": 243878648523187.4, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0466170497238636, "optim/lr": 7.474003274088759e-06, "optim/total_tokens": 1987210903552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2647044658660889, "created_at": "2025-06-03T09:27:36.110390+00:00"} {"global_step": 236895, "acc_step": 0, "speed/wps": 5514.485516063916, "speed/FLOPS": 243712034114432.6, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04693001136183739, "optim/lr": 7.470456048994212e-06, "optim/total_tokens": 1987219292160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2649141550064087, "created_at": "2025-06-03T09:27:39.085889+00:00"} {"global_step": 236896, "acc_step": 0, "speed/wps": 5513.448811087776, "speed/FLOPS": 243666217060824.3, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04817317798733711, "optim/lr": 7.466908823899887e-06, "optim/total_tokens": 1987227680768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2592010498046875, "created_at": "2025-06-03T09:27:42.062074+00:00"} {"global_step": 236897, "acc_step": 0, "speed/wps": 5519.467016389015, "speed/FLOPS": 243932190931171.88, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047885626554489136, "optim/lr": 7.4633615988053405e-06, "optim/total_tokens": 1987236069376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2694382667541504, "created_at": "2025-06-03T09:27:45.039492+00:00"} {"global_step": 236898, "acc_step": 0, "speed/wps": 5505.573898764913, "speed/FLOPS": 243318186243608.97, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.74 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.74, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04661792144179344, "optim/lr": 7.459814373710794e-06, "optim/total_tokens": 1987244457984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2686339616775513, "created_at": "2025-06-03T09:27:48.024267+00:00"} {"global_step": 236899, "acc_step": 0, "speed/wps": 5515.59682677156, "speed/FLOPS": 243761148359506.6, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04661436006426811, "optim/lr": 7.456267148616247e-06, "optim/total_tokens": 1987252846592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.272297978401184, "created_at": "2025-06-03T09:27:51.004725+00:00"} {"global_step": 236900, "acc_step": 0, "speed/wps": 5510.673484513801, "speed/FLOPS": 243543561831663.75, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04738848656415939, "optim/lr": 7.452719923521922e-06, "optim/total_tokens": 1987261235200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2582467794418335, "created_at": "2025-06-03T09:27:53.982858+00:00"} {"global_step": 236901, "acc_step": 0, "speed/wps": 5525.617494321707, "speed/FLOPS": 244204010574797.0, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04672817140817642, "optim/lr": 7.449172698427375e-06, "optim/total_tokens": 1987269623808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2694491147994995, "created_at": "2025-06-03T09:27:56.953829+00:00"} {"global_step": 236902, "acc_step": 0, "speed/wps": 5534.121846721107, "speed/FLOPS": 244579859421628.9, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05038326978683472, "optim/lr": 7.445625473332829e-06, "optim/total_tokens": 1987278012416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2633583545684814, "created_at": "2025-06-03T09:27:59.920434+00:00"} {"global_step": 236903, "acc_step": 0, "speed/wps": 5502.841466411493, "speed/FLOPS": 243197426719444.44, "speed/curr_iter_time": 2.9754, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9754, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04779041185975075, "optim/lr": 7.442078248238282e-06, "optim/total_tokens": 1987286401024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2487173080444336, "created_at": "2025-06-03T09:28:02.903125+00:00"} {"global_step": 236904, "acc_step": 0, "speed/wps": 5518.438094010083, "speed/FLOPS": 243886717828525.25, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.73 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.73, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04758099094033241, "optim/lr": 7.438531023143957e-06, "optim/total_tokens": 1987294789632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.259926438331604, "created_at": "2025-06-03T09:28:05.881721+00:00"} {"global_step": 236905, "acc_step": 0, "speed/wps": 5526.385945714307, "speed/FLOPS": 244237972193059.12, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05085208639502525, "optim/lr": 7.434983798049411e-06, "optim/total_tokens": 1987303178240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2712022066116333, "created_at": "2025-06-03T09:28:08.851560+00:00"} {"global_step": 236906, "acc_step": 0, "speed/wps": 5523.71113792047, "speed/FLOPS": 244119759379478.9, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046672143042087555, "optim/lr": 7.431436572954864e-06, "optim/total_tokens": 1987311566848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2636395692825317, "created_at": "2025-06-03T09:28:11.822327+00:00"} {"global_step": 236907, "acc_step": 0, "speed/wps": 5535.8910013595805, "speed/FLOPS": 244658047001295.06, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 194.62, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.052014950662851334, "optim/lr": 7.427889347860317e-06, "optim/total_tokens": 1987319955456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2730988264083862, "created_at": "2025-06-03T09:28:14.786482+00:00"} {"global_step": 236908, "acc_step": 0, "speed/wps": 5528.626480853454, "speed/FLOPS": 244336992378110.97, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04766395688056946, "optim/lr": 7.4243421227659926e-06, "optim/total_tokens": 1987328344064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2492445707321167, "created_at": "2025-06-03T09:28:17.754884+00:00"} {"global_step": 236909, "acc_step": 0, "speed/wps": 5528.671625197899, "speed/FLOPS": 244338987527065.72, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047780841588974, "optim/lr": 7.420794897671445e-06, "optim/total_tokens": 1987336732672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2600672245025635, "created_at": "2025-06-03T09:28:20.728490+00:00"} {"global_step": 236910, "acc_step": 0, "speed/wps": 5526.203028792536, "speed/FLOPS": 244229888201370.53, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04905451089143753, "optim/lr": 7.417247672576899e-06, "optim/total_tokens": 1987345121280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2651746273040771, "created_at": "2025-06-03T09:28:23.698157+00:00"} {"global_step": 236911, "acc_step": 0, "speed/wps": 5523.1452618305075, "speed/FLOPS": 244094750552718.97, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0470239594578743, "optim/lr": 7.4137004474823525e-06, "optim/total_tokens": 1987353509888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2545570135116577, "created_at": "2025-06-03T09:28:26.672083+00:00"} {"global_step": 236912, "acc_step": 0, "speed/wps": 5518.908301240812, "speed/FLOPS": 243907498581384.7, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.31, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04897315055131912, "optim/lr": 7.410153222388027e-06, "optim/total_tokens": 1987361898496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2583377361297607, "created_at": "2025-06-03T09:28:29.646840+00:00"} {"global_step": 236913, "acc_step": 0, "speed/wps": 5517.081434953871, "speed/FLOPS": 243826760442251.25, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04848925769329071, "optim/lr": 7.406605997293481e-06, "optim/total_tokens": 1987370287104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.270220160484314, "created_at": "2025-06-03T09:28:32.625312+00:00"} {"global_step": 236914, "acc_step": 0, "speed/wps": 5515.288876995411, "speed/FLOPS": 243747538555630.66, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046737171709537506, "optim/lr": 7.403058772198934e-06, "optim/total_tokens": 1987378675712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2640990018844604, "created_at": "2025-06-03T09:28:35.605944+00:00"} {"global_step": 236915, "acc_step": 0, "speed/wps": 5523.410189278606, "speed/FLOPS": 244106458989903.3, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048413969576358795, "optim/lr": 7.399511547104387e-06, "optim/total_tokens": 1987387064320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2607179880142212, "created_at": "2025-06-03T09:28:38.576738+00:00"} {"global_step": 236916, "acc_step": 0, "speed/wps": 5519.389006677461, "speed/FLOPS": 243928743301211.1, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.72 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.72, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04821702092885971, "optim/lr": 7.395964322010063e-06, "optim/total_tokens": 1987395452928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2750627994537354, "created_at": "2025-06-03T09:28:41.551852+00:00"} {"global_step": 236917, "acc_step": 0, "speed/wps": 5531.409844670437, "speed/FLOPS": 244460002812274.16, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047150593250989914, "optim/lr": 7.3924170969155155e-06, "optim/total_tokens": 1987403841536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2631431818008423, "created_at": "2025-06-03T09:28:44.518233+00:00"} {"global_step": 236918, "acc_step": 0, "speed/wps": 5523.828334485554, "speed/FLOPS": 244124938867789.22, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05172952637076378, "optim/lr": 7.388869871820969e-06, "optim/total_tokens": 1987412230144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2486553192138672, "created_at": "2025-06-03T09:28:47.493601+00:00"} {"global_step": 236919, "acc_step": 0, "speed/wps": 5531.778937352638, "speed/FLOPS": 244476314819639.8, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04848919436335564, "optim/lr": 7.385322646726423e-06, "optim/total_tokens": 1987420618752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2654004096984863, "created_at": "2025-06-03T09:28:50.464116+00:00"} {"global_step": 236920, "acc_step": 0, "speed/wps": 5522.555358815354, "speed/FLOPS": 244068679858846.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04679718613624573, "optim/lr": 7.381775421632097e-06, "optim/total_tokens": 1987429007360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2669159173965454, "created_at": "2025-06-03T09:28:53.435525+00:00"} {"global_step": 236921, "acc_step": 0, "speed/wps": 5525.117678808691, "speed/FLOPS": 244181921287409.4, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04694831371307373, "optim/lr": 7.378228196537551e-06, "optim/total_tokens": 1987437395968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2602248191833496, "created_at": "2025-06-03T09:28:56.405887+00:00"} {"global_step": 236922, "acc_step": 0, "speed/wps": 5520.754390687094, "speed/FLOPS": 243989086285768.0, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.26, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047866977751255035, "optim/lr": 7.374680971443004e-06, "optim/total_tokens": 1987445784576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2645823955535889, "created_at": "2025-06-03T09:28:59.377907+00:00"} {"global_step": 236923, "acc_step": 0, "speed/wps": 5540.495777831769, "speed/FLOPS": 244861554551983.22, "speed/curr_iter_time": 2.9549, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9549, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046472445130348206, "optim/lr": 7.371133746348679e-06, "optim/total_tokens": 1987454173184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2708982229232788, "created_at": "2025-06-03T09:29:02.339381+00:00"} {"global_step": 236924, "acc_step": 0, "speed/wps": 5525.98913582974, "speed/FLOPS": 244220435227218.38, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04810033738613129, "optim/lr": 7.367586521254133e-06, "optim/total_tokens": 1987462561792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.270346760749817, "created_at": "2025-06-03T09:29:05.310884+00:00"} {"global_step": 236925, "acc_step": 0, "speed/wps": 5521.415093804863, "speed/FLOPS": 244018285981788.25, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04650678113102913, "optim/lr": 7.364039296159586e-06, "optim/total_tokens": 1987470950400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2637616395950317, "created_at": "2025-06-03T09:29:08.282905+00:00"} {"global_step": 236926, "acc_step": 0, "speed/wps": 5523.248404767424, "speed/FLOPS": 244099308942597.28, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04695655032992363, "optim/lr": 7.360492071065039e-06, "optim/total_tokens": 1987479339008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2701146602630615, "created_at": "2025-06-03T09:29:11.256517+00:00"} {"global_step": 236927, "acc_step": 0, "speed/wps": 5521.07779398075, "speed/FLOPS": 244003379056019.47, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04815857112407684, "optim/lr": 7.356944845970715e-06, "optim/total_tokens": 1987487727616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.252413272857666, "created_at": "2025-06-03T09:29:14.231991+00:00"} {"global_step": 236928, "acc_step": 0, "speed/wps": 5521.588387898134, "speed/FLOPS": 244025944693711.25, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046960752457380295, "optim/lr": 7.3533976208761675e-06, "optim/total_tokens": 1987496116224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2612146139144897, "created_at": "2025-06-03T09:29:17.208023+00:00"} {"global_step": 236929, "acc_step": 0, "speed/wps": 5516.298370158235, "speed/FLOPS": 243792152986373.1, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.71 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.71, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04706023633480072, "optim/lr": 7.349850395781621e-06, "optim/total_tokens": 1987504504832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.24310302734375, "created_at": "2025-06-03T09:29:20.182469+00:00"} {"global_step": 236930, "acc_step": 0, "speed/wps": 5537.4124576282975, "speed/FLOPS": 244725287580853.22, "speed/curr_iter_time": 2.9567, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9567, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 194.59, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04843417555093765, "optim/lr": 7.346303170687074e-06, "optim/total_tokens": 1987512893440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2753621339797974, "created_at": "2025-06-03T09:29:23.148938+00:00"} {"global_step": 236931, "acc_step": 0, "speed/wps": 5525.822270822196, "speed/FLOPS": 244213060647977.44, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047675721347332, "optim/lr": 7.342755945592749e-06, "optim/total_tokens": 1987521282048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2537047863006592, "created_at": "2025-06-03T09:29:26.119183+00:00"} {"global_step": 236932, "acc_step": 0, "speed/wps": 5530.456790861495, "speed/FLOPS": 244417882712090.53, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04834112524986267, "optim/lr": 7.339208720498203e-06, "optim/total_tokens": 1987529670656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2550605535507202, "created_at": "2025-06-03T09:29:29.088767+00:00"} {"global_step": 236933, "acc_step": 0, "speed/wps": 5522.155126737823, "speed/FLOPS": 244050991649593.12, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04606802016496658, "optim/lr": 7.335661495403656e-06, "optim/total_tokens": 1987538059264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2707520723342896, "created_at": "2025-06-03T09:29:32.060472+00:00"} {"global_step": 236934, "acc_step": 0, "speed/wps": 5515.607726010064, "speed/FLOPS": 243761630050061.12, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047150619328022, "optim/lr": 7.332114270309109e-06, "optim/total_tokens": 1987546447872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2614192962646484, "created_at": "2025-06-03T09:29:35.037546+00:00"} {"global_step": 236935, "acc_step": 0, "speed/wps": 5519.914154744813, "speed/FLOPS": 243951952157836.56, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0477619394659996, "optim/lr": 7.328567045214785e-06, "optim/total_tokens": 1987554836480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2600587606430054, "created_at": "2025-06-03T09:29:38.010382+00:00"} {"global_step": 236936, "acc_step": 0, "speed/wps": 5529.375948286305, "speed/FLOPS": 244370115002520.9, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04713276028633118, "optim/lr": 7.325019820120238e-06, "optim/total_tokens": 1987563225088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2707058191299438, "created_at": "2025-06-03T09:29:40.982529+00:00"} {"global_step": 236937, "acc_step": 0, "speed/wps": 5515.494646830243, "speed/FLOPS": 243756632529104.75, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046766068786382675, "optim/lr": 7.321472595025691e-06, "optim/total_tokens": 1987571613696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2635953426361084, "created_at": "2025-06-03T09:29:43.959170+00:00"} {"global_step": 236938, "acc_step": 0, "speed/wps": 5524.432416682326, "speed/FLOPS": 244151636208913.6, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04722709208726883, "optim/lr": 7.317925369931144e-06, "optim/total_tokens": 1987580002304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2616716623306274, "created_at": "2025-06-03T09:29:46.929313+00:00"} {"global_step": 236939, "acc_step": 0, "speed/wps": 5525.7736478567, "speed/FLOPS": 244210911761777.44, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04686790332198143, "optim/lr": 7.3143781448368196e-06, "optim/total_tokens": 1987588390912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2629717588424683, "created_at": "2025-06-03T09:29:49.899375+00:00"} {"global_step": 236940, "acc_step": 0, "speed/wps": 5534.616491038925, "speed/FLOPS": 244601720168657.3, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 194.7, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04745195806026459, "optim/lr": 7.310830919742273e-06, "optim/total_tokens": 1987596779520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2678179740905762, "created_at": "2025-06-03T09:29:52.865394+00:00"} {"global_step": 236941, "acc_step": 0, "speed/wps": 5521.774009076159, "speed/FLOPS": 244034148199684.62, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04887497425079346, "optim/lr": 7.307283694647726e-06, "optim/total_tokens": 1987605168128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.267722249031067, "created_at": "2025-06-03T09:29:55.842343+00:00"} {"global_step": 236942, "acc_step": 0, "speed/wps": 5521.408192420291, "speed/FLOPS": 244017980975914.66, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.7 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.7, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04740598425269127, "optim/lr": 7.3037364695531795e-06, "optim/total_tokens": 1987613556736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2452993392944336, "created_at": "2025-06-03T09:29:58.817909+00:00"} {"global_step": 236943, "acc_step": 0, "speed/wps": 5522.723992214442, "speed/FLOPS": 244076132591942.25, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048013921827077866, "optim/lr": 7.300189244458855e-06, "optim/total_tokens": 1987621945344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2657747268676758, "created_at": "2025-06-03T09:30:01.789400+00:00"} {"global_step": 236944, "acc_step": 0, "speed/wps": 5532.112284001541, "speed/FLOPS": 244491047035298.5, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04811527952551842, "optim/lr": 7.296642019364308e-06, "optim/total_tokens": 1987630333952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2641500234603882, "created_at": "2025-06-03T09:30:04.755329+00:00"} {"global_step": 236945, "acc_step": 0, "speed/wps": 5530.66459604446, "speed/FLOPS": 244427066637534.22, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04720137268304825, "optim/lr": 7.2930947942697614e-06, "optim/total_tokens": 1987638722560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2530808448791504, "created_at": "2025-06-03T09:30:07.727286+00:00"} {"global_step": 236946, "acc_step": 0, "speed/wps": 5522.101978342794, "speed/FLOPS": 244048642762571.0, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0467696450650692, "optim/lr": 7.289547569175214e-06, "optim/total_tokens": 1987647111168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2627472877502441, "created_at": "2025-06-03T09:30:10.701462+00:00"} {"global_step": 236947, "acc_step": 0, "speed/wps": 5515.0630541447445, "speed/FLOPS": 243737558341497.34, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05505920574069023, "optim/lr": 7.28600034408089e-06, "optim/total_tokens": 1987655499776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2571115493774414, "created_at": "2025-06-03T09:30:13.677416+00:00"} {"global_step": 236948, "acc_step": 0, "speed/wps": 5529.496009311157, "speed/FLOPS": 244375421085291.3, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04800383374094963, "optim/lr": 7.282453118986343e-06, "optim/total_tokens": 1987663888384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2676615715026855, "created_at": "2025-06-03T09:30:16.650404+00:00"} {"global_step": 236949, "acc_step": 0, "speed/wps": 5522.965314972118, "speed/FLOPS": 244086797822629.7, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04791174456477165, "optim/lr": 7.278905893891796e-06, "optim/total_tokens": 1987672276992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2840111255645752, "created_at": "2025-06-03T09:30:19.622396+00:00"} {"global_step": 236950, "acc_step": 0, "speed/wps": 5523.422910836741, "speed/FLOPS": 244107021217658.06, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04764091968536377, "optim/lr": 7.275358668797472e-06, "optim/total_tokens": 1987680665600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2494341135025024, "created_at": "2025-06-03T09:30:22.596669+00:00"} {"global_step": 236951, "acc_step": 0, "speed/wps": 5524.984499043635, "speed/FLOPS": 244176035423469.75, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05188475176692009, "optim/lr": 7.271811443702925e-06, "optim/total_tokens": 1987689054208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2421537637710571, "created_at": "2025-06-03T09:30:25.572491+00:00"} {"global_step": 236952, "acc_step": 0, "speed/wps": 5531.030097853709, "speed/FLOPS": 244443219946695.16, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04742886498570442, "optim/lr": 7.268264218608378e-06, "optim/total_tokens": 1987697442816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2711364030838013, "created_at": "2025-06-03T09:30:28.540441+00:00"} {"global_step": 236953, "acc_step": 0, "speed/wps": 5515.443080376238, "speed/FLOPS": 243754353555778.75, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.69 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.69, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04713115468621254, "optim/lr": 7.2647169935138316e-06, "optim/total_tokens": 1987705831424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2481894493103027, "created_at": "2025-06-03T09:30:31.515660+00:00"} {"global_step": 236954, "acc_step": 0, "speed/wps": 5524.752640889647, "speed/FLOPS": 244165788479821.12, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04763462767004967, "optim/lr": 7.261169768419506e-06, "optim/total_tokens": 1987714220032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2661831378936768, "created_at": "2025-06-03T09:30:34.489651+00:00"} {"global_step": 236955, "acc_step": 0, "speed/wps": 5524.8478984694, "speed/FLOPS": 244169998377273.7, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04728953540325165, "optim/lr": 7.25762254332496e-06, "optim/total_tokens": 1987722608640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.253483533859253, "created_at": "2025-06-03T09:30:37.463058+00:00"} {"global_step": 236956, "acc_step": 0, "speed/wps": 5521.454830172706, "speed/FLOPS": 244020042125857.75, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.26, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0473816804587841, "optim/lr": 7.2540753182304135e-06, "optim/total_tokens": 1987730997248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2707997560501099, "created_at": "2025-06-03T09:30:40.439543+00:00"} {"global_step": 236957, "acc_step": 0, "speed/wps": 5519.587878780971, "speed/FLOPS": 243937532430266.53, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04669836908578873, "optim/lr": 7.250528093135866e-06, "optim/total_tokens": 1987739385856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2578439712524414, "created_at": "2025-06-03T09:30:43.415869+00:00"} {"global_step": 236958, "acc_step": 0, "speed/wps": 5527.956909445868, "speed/FLOPS": 244307400749072.84, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04686790332198143, "optim/lr": 7.246980868041542e-06, "optim/total_tokens": 1987747774464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2588942050933838, "created_at": "2025-06-03T09:30:46.387040+00:00"} {"global_step": 236959, "acc_step": 0, "speed/wps": 5526.1726856550595, "speed/FLOPS": 244228547190004.3, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0474475733935833, "optim/lr": 7.2434336429469945e-06, "optim/total_tokens": 1987756163072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.264095664024353, "created_at": "2025-06-03T09:30:49.356534+00:00"} {"global_step": 236960, "acc_step": 0, "speed/wps": 5520.668391273549, "speed/FLOPS": 243985285551874.2, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04767687991261482, "optim/lr": 7.239886417852448e-06, "optim/total_tokens": 1987764551680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2586276531219482, "created_at": "2025-06-03T09:30:52.329714+00:00"} {"global_step": 236961, "acc_step": 0, "speed/wps": 5512.819998162336, "speed/FLOPS": 243638426748076.16, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04815041646361351, "optim/lr": 7.236339192757902e-06, "optim/total_tokens": 1987772940288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2617114782333374, "created_at": "2025-06-03T09:30:55.309538+00:00"} {"global_step": 236962, "acc_step": 0, "speed/wps": 5532.24746646088, "speed/FLOPS": 244497021408074.72, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04690054804086685, "optim/lr": 7.232791967663576e-06, "optim/total_tokens": 1987781328896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2700066566467285, "created_at": "2025-06-03T09:30:58.276634+00:00"} {"global_step": 236963, "acc_step": 0, "speed/wps": 5514.726756399043, "speed/FLOPS": 243722695702465.22, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04848967492580414, "optim/lr": 7.22924474256903e-06, "optim/total_tokens": 1987789717504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.27284836769104, "created_at": "2025-06-03T09:31:01.252237+00:00"} {"global_step": 236964, "acc_step": 0, "speed/wps": 5512.383188738527, "speed/FLOPS": 243619122007337.12, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04684475436806679, "optim/lr": 7.225697517474484e-06, "optim/total_tokens": 1987798106112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2661230564117432, "created_at": "2025-06-03T09:31:04.231021+00:00"} {"global_step": 236965, "acc_step": 0, "speed/wps": 5526.1917907957195, "speed/FLOPS": 244229391539432.53, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04748227447271347, "optim/lr": 7.222150292379936e-06, "optim/total_tokens": 1987806494720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.25570547580719, "created_at": "2025-06-03T09:31:07.200549+00:00"} {"global_step": 236966, "acc_step": 0, "speed/wps": 5536.1604749261605, "speed/FLOPS": 244669956353647.16, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04810220003128052, "optim/lr": 7.218603067285612e-06, "optim/total_tokens": 1987814883328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2797185182571411, "created_at": "2025-06-03T09:31:10.165331+00:00"} {"global_step": 236967, "acc_step": 0, "speed/wps": 5528.514709302996, "speed/FLOPS": 244332052647679.4, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047384124249219894, "optim/lr": 7.215055842191065e-06, "optim/total_tokens": 1987823271936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.264266014099121, "created_at": "2025-06-03T09:31:13.134170+00:00"} {"global_step": 236968, "acc_step": 0, "speed/wps": 5509.7253001265, "speed/FLOPS": 243501656934992.72, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047041118144989014, "optim/lr": 7.211508617096518e-06, "optim/total_tokens": 1987831660544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.265569806098938, "created_at": "2025-06-03T09:31:16.117733+00:00"} {"global_step": 236969, "acc_step": 0, "speed/wps": 5515.213412912223, "speed/FLOPS": 243744203429413.97, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.68 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.68, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04745768383145332, "optim/lr": 7.207961392001972e-06, "optim/total_tokens": 1987840049152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2584806680679321, "created_at": "2025-06-03T09:31:19.093221+00:00"} {"global_step": 236970, "acc_step": 0, "speed/wps": 5514.885561618304, "speed/FLOPS": 243729714080317.75, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04650302976369858, "optim/lr": 7.2044141669076466e-06, "optim/total_tokens": 1987848437760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2843270301818848, "created_at": "2025-06-03T09:31:22.070248+00:00"} {"global_step": 236971, "acc_step": 0, "speed/wps": 5512.432244366633, "speed/FLOPS": 243621290015009.97, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04656364768743515, "optim/lr": 7.2008669418131e-06, "optim/total_tokens": 1987856826368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2553136348724365, "created_at": "2025-06-03T09:31:25.050365+00:00"} {"global_step": 236972, "acc_step": 0, "speed/wps": 5536.12599312092, "speed/FLOPS": 244668432434349.4, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 194.75, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04681960865855217, "optim/lr": 7.197319716718553e-06, "optim/total_tokens": 1987865214976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2441309690475464, "created_at": "2025-06-03T09:31:28.014792+00:00"} {"global_step": 236973, "acc_step": 0, "speed/wps": 5535.555120759025, "speed/FLOPS": 244643202797943.28, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04727904871106148, "optim/lr": 7.1937724916240065e-06, "optim/total_tokens": 1987873603584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.278052806854248, "created_at": "2025-06-03T09:31:30.979022+00:00"} {"global_step": 236974, "acc_step": 0, "speed/wps": 5537.187319595796, "speed/FLOPS": 244715337632177.56, "speed/curr_iter_time": 2.9567, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9567, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 194.63, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04685118794441223, "optim/lr": 7.190225266529682e-06, "optim/total_tokens": 1987881992192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2669928073883057, "created_at": "2025-06-03T09:31:33.942328+00:00"} {"global_step": 236975, "acc_step": 0, "speed/wps": 5532.0849342115225, "speed/FLOPS": 244489838314568.6, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04677964746952057, "optim/lr": 7.186678041435135e-06, "optim/total_tokens": 1987890380800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.267106294631958, "created_at": "2025-06-03T09:31:36.908303+00:00"} {"global_step": 236976, "acc_step": 0, "speed/wps": 5523.3448742371, "speed/FLOPS": 244103572399381.47, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04897690191864967, "optim/lr": 7.183130816340588e-06, "optim/total_tokens": 1987898769408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.247880458831787, "created_at": "2025-06-03T09:31:39.883250+00:00"} {"global_step": 236977, "acc_step": 0, "speed/wps": 5531.124658603994, "speed/FLOPS": 244447399047851.97, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04684000462293625, "optim/lr": 7.179583591246264e-06, "optim/total_tokens": 1987907158016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2670518159866333, "created_at": "2025-06-03T09:31:42.853205+00:00"} {"global_step": 236978, "acc_step": 0, "speed/wps": 5530.960547295775, "speed/FLOPS": 244440146168026.5, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047830116003751755, "optim/lr": 7.176036366151717e-06, "optim/total_tokens": 1987915546624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2622495889663696, "created_at": "2025-06-03T09:31:45.820028+00:00"} {"global_step": 236979, "acc_step": 0, "speed/wps": 5519.12248270239, "speed/FLOPS": 243916964305706.3, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.67 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.67, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.055592846125364304, "optim/lr": 7.17248914105717e-06, "optim/total_tokens": 1987923935232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2521367073059082, "created_at": "2025-06-03T09:31:48.797790+00:00"} {"global_step": 236980, "acc_step": 0, "speed/wps": 5524.0669411193885, "speed/FLOPS": 244135484059705.25, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0507822260260582, "optim/lr": 7.168941915962623e-06, "optim/total_tokens": 1987932323840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2600562572479248, "created_at": "2025-06-03T09:31:51.768254+00:00"} {"global_step": 236981, "acc_step": 0, "speed/wps": 5525.005297750938, "speed/FLOPS": 244176954619875.1, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046901945024728775, "optim/lr": 7.165394690868299e-06, "optim/total_tokens": 1987940712448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2646235227584839, "created_at": "2025-06-03T09:31:54.740392+00:00"} {"global_step": 236982, "acc_step": 0, "speed/wps": 5529.317930254542, "speed/FLOPS": 244367550902480.22, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.050342630594968796, "optim/lr": 7.161847465773752e-06, "optim/total_tokens": 1987949101056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2487543821334839, "created_at": "2025-06-03T09:31:57.707845+00:00"} {"global_step": 236983, "acc_step": 0, "speed/wps": 5534.433329654541, "speed/FLOPS": 244593625372972.47, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04713641479611397, "optim/lr": 7.158300240679205e-06, "optim/total_tokens": 1987957489664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2667465209960938, "created_at": "2025-06-03T09:32:00.672845+00:00"} {"global_step": 236984, "acc_step": 0, "speed/wps": 5516.960091461964, "speed/FLOPS": 243821397681001.22, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04718346148729324, "optim/lr": 7.1547530155846586e-06, "optim/total_tokens": 1987965878272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2595641613006592, "created_at": "2025-06-03T09:32:03.649703+00:00"} {"global_step": 236985, "acc_step": 0, "speed/wps": 5530.168582142101, "speed/FLOPS": 244405145361879.22, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04875559359788895, "optim/lr": 7.151205790490334e-06, "optim/total_tokens": 1987974266880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.262160301208496, "created_at": "2025-06-03T09:32:06.619542+00:00"} {"global_step": 236986, "acc_step": 0, "speed/wps": 5525.606234842256, "speed/FLOPS": 244203512963436.47, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046538740396499634, "optim/lr": 7.147658565395787e-06, "optim/total_tokens": 1987982655488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2666897773742676, "created_at": "2025-06-03T09:32:09.589145+00:00"} {"global_step": 236987, "acc_step": 0, "speed/wps": 5529.041054138106, "speed/FLOPS": 244355314395314.16, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0479586236178875, "optim/lr": 7.1441113403012405e-06, "optim/total_tokens": 1987991044096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2535778284072876, "created_at": "2025-06-03T09:32:12.559258+00:00"} {"global_step": 236988, "acc_step": 0, "speed/wps": 5511.765894042461, "speed/FLOPS": 243591840741371.7, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.66 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.66, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04753116890788078, "optim/lr": 7.140564115206693e-06, "optim/total_tokens": 1987999432704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2667512893676758, "created_at": "2025-06-03T09:32:15.540209+00:00"} {"global_step": 236989, "acc_step": 0, "speed/wps": 5534.781133250686, "speed/FLOPS": 244608996511701.9, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04815565049648285, "optim/lr": 7.137016890112369e-06, "optim/total_tokens": 1988007821312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2526189088821411, "created_at": "2025-06-03T09:32:18.504783+00:00"} {"global_step": 236990, "acc_step": 0, "speed/wps": 5535.814282181867, "speed/FLOPS": 244654656406324.5, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04702599719166756, "optim/lr": 7.133469665017822e-06, "optim/total_tokens": 1988016209920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2626299858093262, "created_at": "2025-06-03T09:32:21.472151+00:00"} {"global_step": 236991, "acc_step": 0, "speed/wps": 5527.818424901049, "speed/FLOPS": 244301280441019.97, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0489477701485157, "optim/lr": 7.129922439923275e-06, "optim/total_tokens": 1988024598528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2639315128326416, "created_at": "2025-06-03T09:32:24.443829+00:00"} {"global_step": 236992, "acc_step": 0, "speed/wps": 5526.390713783968, "speed/FLOPS": 244238182917332.94, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04707694798707962, "optim/lr": 7.126375214828729e-06, "optim/total_tokens": 1988032987136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.255194067955017, "created_at": "2025-06-03T09:32:27.416647+00:00"} {"global_step": 236993, "acc_step": 0, "speed/wps": 5524.789912091797, "speed/FLOPS": 244167435676184.84, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04676266759634018, "optim/lr": 7.122827989734404e-06, "optim/total_tokens": 1988041375744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2554500102996826, "created_at": "2025-06-03T09:32:30.392908+00:00"} {"global_step": 236994, "acc_step": 0, "speed/wps": 5524.381323974167, "speed/FLOPS": 244149378172729.12, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04786257818341255, "optim/lr": 7.119280764639857e-06, "optim/total_tokens": 1988049764352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.286807894706726, "created_at": "2025-06-03T09:32:33.367321+00:00"} {"global_step": 236995, "acc_step": 0, "speed/wps": 5516.84564024634, "speed/FLOPS": 243816339523085.06, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 195.45, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0490071177482605, "optim/lr": 7.115733539545311e-06, "optim/total_tokens": 1988058152960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2446675300598145, "created_at": "2025-06-03T09:32:36.342037+00:00"} {"global_step": 236996, "acc_step": 0, "speed/wps": 5515.450787356483, "speed/FLOPS": 243754694164857.7, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046986352652311325, "optim/lr": 7.112186314450763e-06, "optim/total_tokens": 1988066541568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2748275995254517, "created_at": "2025-06-03T09:32:39.316903+00:00"} {"global_step": 236997, "acc_step": 0, "speed/wps": 5531.981016521436, "speed/FLOPS": 244485245684565.72, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 194.92, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04680058732628822, "optim/lr": 7.108639089356439e-06, "optim/total_tokens": 1988074930176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.242857813835144, "created_at": "2025-06-03T09:32:42.283111+00:00"} {"global_step": 236998, "acc_step": 0, "speed/wps": 5535.375668031747, "speed/FLOPS": 244635271905919.94, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 194.71, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0470360592007637, "optim/lr": 7.1050918642618925e-06, "optim/total_tokens": 1988083318784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2563945055007935, "created_at": "2025-06-03T09:32:45.248288+00:00"} {"global_step": 236999, "acc_step": 0, "speed/wps": 5528.932302369156, "speed/FLOPS": 244350508123768.56, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048229776322841644, "optim/lr": 7.101544639167345e-06, "optim/total_tokens": 1988091707392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2534430027008057, "created_at": "2025-06-03T09:32:48.215941+00:00"} {"global_step": 237000, "acc_step": 0, "speed/wps": 5528.119688225181, "speed/FLOPS": 244314594737941.12, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.65 hours", "speed/est_time_elapsed_hrs": 195.06, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.65, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04611271247267723, "optim/lr": 7.097997414072799e-06, "optim/total_tokens": 1988100096000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2528679370880127, "created_at": "2025-06-03T09:32:51.190510+00:00"} {"global_step": 237001, "acc_step": 0, "speed/wps": 223.6355846180785, "speed/FLOPS": 9883548169430.082, "speed/curr_iter_time": 5.7382, "speed/data_load_time": 3.8515, "speed/curr_step_time": 5.7382, "speed/est_time_elapsed": "15.74 days", "speed/est_time_remaining": "3.19 hours", "speed/est_time_elapsed_hrs": 377.77, "speed/est_time_elapsed_days": 15.74, "speed/est_time_remaining_hrs": 3.19, "speed/est_time_remaining_days": 0.13, "optim/grad_norm": 0.04651501029729843, "optim/lr": 7.094450188978474e-06, "optim/total_tokens": 1988108484608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2538394927978516, "created_at": "2025-06-03T09:34:04.459583+00:00"} {"global_step": 237002, "acc_step": 0, "speed/wps": 5624.7027553051075, "speed/FLOPS": 248583071945922.03, "speed/curr_iter_time": 2.9096, "speed/data_load_time": 0.0013, "speed/curr_step_time": 2.9096, "speed/est_time_elapsed": "7.98 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 191.55, "speed/est_time_elapsed_days": 7.98, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0471423976123333, "optim/lr": 7.090902963883927e-06, "optim/total_tokens": 1988116873216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2681925296783447, "created_at": "2025-06-03T09:34:07.381643+00:00"} {"global_step": 237003, "acc_step": 0, "speed/wps": 5577.8097707129955, "speed/FLOPS": 246510642047004.16, "speed/curr_iter_time": 2.9362, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9362, "speed/est_time_elapsed": "8.05 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 193.3, "speed/est_time_elapsed_days": 8.05, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047480508685112, "optim/lr": 7.087355738789381e-06, "optim/total_tokens": 1988125261824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2737385034561157, "created_at": "2025-06-03T09:34:10.325922+00:00"} {"global_step": 237004, "acc_step": 0, "speed/wps": 5587.2824845758805, "speed/FLOPS": 246929287513998.78, "speed/curr_iter_time": 2.93, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.93, "speed/est_time_elapsed": "8.04 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 192.89, "speed/est_time_elapsed_days": 8.04, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048709046095609665, "optim/lr": 7.0838085136950555e-06, "optim/total_tokens": 1988133650432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2632770538330078, "created_at": "2025-06-03T09:34:13.267138+00:00"} {"global_step": 237005, "acc_step": 0, "speed/wps": 5554.954972388682, "speed/FLOPS": 245500576942531.97, "speed/curr_iter_time": 2.9484, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9484, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.11, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04677971079945564, "optim/lr": 7.080261288600509e-06, "optim/total_tokens": 1988142039040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2753671407699585, "created_at": "2025-06-03T09:34:16.225604+00:00"} {"global_step": 237006, "acc_step": 0, "speed/wps": 5539.222559404276, "speed/FLOPS": 244805284814410.7, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 194.66, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04618944227695465, "optim/lr": 7.076714063505963e-06, "optim/total_tokens": 1988150427648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2575571537017822, "created_at": "2025-06-03T09:34:19.189480+00:00"} {"global_step": 237007, "acc_step": 0, "speed/wps": 5539.09461503084, "speed/FLOPS": 244799630327983.5, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 194.67, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04787864536046982, "optim/lr": 7.073166838411415e-06, "optim/total_tokens": 1988158816256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.25154709815979, "created_at": "2025-06-03T09:34:22.155254+00:00"} {"global_step": 237008, "acc_step": 0, "speed/wps": 5550.097919700127, "speed/FLOPS": 245285920074347.16, "speed/curr_iter_time": 2.9498, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9498, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04815274849534035, "optim/lr": 7.069619613317091e-06, "optim/total_tokens": 1988167204864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2601169347763062, "created_at": "2025-06-03T09:34:25.112372+00:00"} {"global_step": 237009, "acc_step": 0, "speed/wps": 5539.814535810779, "speed/FLOPS": 244831447141568.2, "speed/curr_iter_time": 2.9566, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9566, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04622538015246391, "optim/lr": 7.0660723882225446e-06, "optim/total_tokens": 1988175593472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.242011308670044, "created_at": "2025-06-03T09:34:28.075590+00:00"} {"global_step": 237010, "acc_step": 0, "speed/wps": 5530.617868216111, "speed/FLOPS": 244425001506695.88, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04791874811053276, "optim/lr": 7.062525163127997e-06, "optim/total_tokens": 1988183982080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2660609483718872, "created_at": "2025-06-03T09:34:31.044499+00:00"} {"global_step": 237011, "acc_step": 0, "speed/wps": 5520.174179935394, "speed/FLOPS": 243963443940330.7, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 195.26, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04802347347140312, "optim/lr": 7.058977938033451e-06, "optim/total_tokens": 1988192370688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.256263017654419, "created_at": "2025-06-03T09:34:34.021211+00:00"} {"global_step": 237012, "acc_step": 0, "speed/wps": 5537.532123621566, "speed/FLOPS": 244730576205249.62, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.73, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04827845096588135, "optim/lr": 7.055430712939126e-06, "optim/total_tokens": 1988200759296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.257567048072815, "created_at": "2025-06-03T09:34:36.987615+00:00"} {"global_step": 237013, "acc_step": 0, "speed/wps": 5526.69766961397, "speed/FLOPS": 244251748793876.66, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046732135117053986, "optim/lr": 7.051883487844579e-06, "optim/total_tokens": 1988209147904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2641180753707886, "created_at": "2025-06-03T09:34:39.962015+00:00"} {"global_step": 237014, "acc_step": 0, "speed/wps": 5530.804644291509, "speed/FLOPS": 244433256053221.88, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047659434378147125, "optim/lr": 7.048336262750033e-06, "optim/total_tokens": 1988217536512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2665399312973022, "created_at": "2025-06-03T09:34:42.932963+00:00"} {"global_step": 237015, "acc_step": 0, "speed/wps": 5523.362085210852, "speed/FLOPS": 244104333036327.53, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.64 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.64, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04731590673327446, "optim/lr": 7.0447890376554856e-06, "optim/total_tokens": 1988225925120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2499679327011108, "created_at": "2025-06-03T09:34:45.908808+00:00"} {"global_step": 237016, "acc_step": 0, "speed/wps": 5542.322049087522, "speed/FLOPS": 244942266393783.8, "speed/curr_iter_time": 2.9553, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9553, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.57, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04683408886194229, "optim/lr": 7.041241812561161e-06, "optim/total_tokens": 1988234313728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.272964358329773, "created_at": "2025-06-03T09:34:48.870132+00:00"} {"global_step": 237017, "acc_step": 0, "speed/wps": 5553.111419972538, "speed/FLOPS": 245419101361895.06, "speed/curr_iter_time": 2.9496, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9496, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 194.2, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048091866075992584, "optim/lr": 7.037694587466615e-06, "optim/total_tokens": 1988242702336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.242522120475769, "created_at": "2025-06-03T09:34:51.829793+00:00"} {"global_step": 237018, "acc_step": 0, "speed/wps": 5543.112477419131, "speed/FLOPS": 244977199280261.97, "speed/curr_iter_time": 2.9534, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9534, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.45, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04783054068684578, "optim/lr": 7.0341473623720675e-06, "optim/total_tokens": 1988251090944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.258972406387329, "created_at": "2025-06-03T09:34:54.792707+00:00"} {"global_step": 237019, "acc_step": 0, "speed/wps": 5534.658928535426, "speed/FLOPS": 244603595688787.84, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.84, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04687841609120369, "optim/lr": 7.030600137277521e-06, "optim/total_tokens": 1988259479552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2595807313919067, "created_at": "2025-06-03T09:34:57.757574+00:00"} {"global_step": 237020, "acc_step": 0, "speed/wps": 5523.8909434570505, "speed/FLOPS": 244127705863867.62, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05026742070913315, "optim/lr": 7.027052912183196e-06, "optim/total_tokens": 1988267868160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2723225355148315, "created_at": "2025-06-03T09:35:00.732074+00:00"} {"global_step": 237021, "acc_step": 0, "speed/wps": 5532.9589156118445, "speed/FLOPS": 244528463819020.5, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.81, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04743971675634384, "optim/lr": 7.023505687088649e-06, "optim/total_tokens": 1988276256768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2702561616897583, "created_at": "2025-06-03T09:35:03.698742+00:00"} {"global_step": 237022, "acc_step": 0, "speed/wps": 5533.647015841929, "speed/FLOPS": 244558874327173.97, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04765566438436508, "optim/lr": 7.019958461994103e-06, "optim/total_tokens": 1988284645376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2590428590774536, "created_at": "2025-06-03T09:35:06.667254+00:00"} {"global_step": 237023, "acc_step": 0, "speed/wps": 5519.863963059645, "speed/FLOPS": 243949733942256.5, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04767245054244995, "optim/lr": 7.016411236899556e-06, "optim/total_tokens": 1988293033984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2548738718032837, "created_at": "2025-06-03T09:35:09.640540+00:00"} {"global_step": 237024, "acc_step": 0, "speed/wps": 5542.872865799457, "speed/FLOPS": 244966609673115.84, "speed/curr_iter_time": 2.9537, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9537, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 194.47, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0472380556166172, "optim/lr": 7.012864011805231e-06, "optim/total_tokens": 1988301422592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2427518367767334, "created_at": "2025-06-03T09:35:12.605242+00:00"} {"global_step": 237025, "acc_step": 0, "speed/wps": 5531.059043605213, "speed/FLOPS": 244444499200753.88, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048584457486867905, "optim/lr": 7.009316786710684e-06, "optim/total_tokens": 1988309811200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2709087133407593, "created_at": "2025-06-03T09:35:15.575085+00:00"} {"global_step": 237026, "acc_step": 0, "speed/wps": 5527.008395932656, "speed/FLOPS": 244265481306721.1, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046575918793678284, "optim/lr": 7.005769561616138e-06, "optim/total_tokens": 1988318199808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.259398102760315, "created_at": "2025-06-03T09:35:18.544071+00:00"} {"global_step": 237027, "acc_step": 0, "speed/wps": 5520.77907307469, "speed/FLOPS": 243990177120963.8, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04907349869608879, "optim/lr": 7.002222336521591e-06, "optim/total_tokens": 1988326588416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2808438539505005, "created_at": "2025-06-03T09:35:21.522102+00:00"} {"global_step": 237028, "acc_step": 0, "speed/wps": 5510.632949034819, "speed/FLOPS": 243541770370972.16, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047116782516241074, "optim/lr": 6.998675111427266e-06, "optim/total_tokens": 1988334977024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2653894424438477, "created_at": "2025-06-03T09:35:24.503586+00:00"} {"global_step": 237029, "acc_step": 0, "speed/wps": 5524.863853492823, "speed/FLOPS": 244170703507643.78, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.050500743091106415, "optim/lr": 6.9951278863327195e-06, "optim/total_tokens": 1988343365632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2741293907165527, "created_at": "2025-06-03T09:35:27.474495+00:00"} {"global_step": 237030, "acc_step": 0, "speed/wps": 5521.054653193707, "speed/FLOPS": 244002356351677.44, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047790199518203735, "optim/lr": 6.991580661238173e-06, "optim/total_tokens": 1988351754240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.26167631149292, "created_at": "2025-06-03T09:35:30.449116+00:00"} {"global_step": 237031, "acc_step": 0, "speed/wps": 5506.946560351851, "speed/FLOPS": 243378850859832.72, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.63 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.63, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04662661999464035, "optim/lr": 6.988033436143848e-06, "optim/total_tokens": 1988360142848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2486928701400757, "created_at": "2025-06-03T09:35:33.432880+00:00"} {"global_step": 237032, "acc_step": 0, "speed/wps": 5520.439817643268, "speed/FLOPS": 243975183767361.66, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04755640774965286, "optim/lr": 6.984486211049301e-06, "optim/total_tokens": 1988368531456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.270990252494812, "created_at": "2025-06-03T09:35:36.409180+00:00"} {"global_step": 237033, "acc_step": 0, "speed/wps": 5514.636564199866, "speed/FLOPS": 243718709668907.16, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04707992076873779, "optim/lr": 6.980938985954754e-06, "optim/total_tokens": 1988376920064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.265604019165039, "created_at": "2025-06-03T09:35:39.384775+00:00"} {"global_step": 237034, "acc_step": 0, "speed/wps": 5529.510712881601, "speed/FLOPS": 244376070907845.25, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04839468374848366, "optim/lr": 6.977391760860208e-06, "optim/total_tokens": 1988385308672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2611854076385498, "created_at": "2025-06-03T09:35:42.356733+00:00"} {"global_step": 237035, "acc_step": 0, "speed/wps": 5529.244493037862, "speed/FLOPS": 244364305353388.72, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046743642538785934, "optim/lr": 6.973844535765883e-06, "optim/total_tokens": 1988393697280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2630361318588257, "created_at": "2025-06-03T09:35:45.324517+00:00"} {"global_step": 237036, "acc_step": 0, "speed/wps": 5517.429702921813, "speed/FLOPS": 243842152103837.22, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04720142483711243, "optim/lr": 6.970297310671336e-06, "optim/total_tokens": 1988402085888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2662941217422485, "created_at": "2025-06-03T09:35:48.303786+00:00"} {"global_step": 237037, "acc_step": 0, "speed/wps": 5510.335855654517, "speed/FLOPS": 243528640364224.6, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04751915484666824, "optim/lr": 6.96675008557679e-06, "optim/total_tokens": 1988410474496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2744983434677124, "created_at": "2025-06-03T09:35:51.281870+00:00"} {"global_step": 237038, "acc_step": 0, "speed/wps": 5520.132438875776, "speed/FLOPS": 243961599199145.66, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04703963175415993, "optim/lr": 6.963202860482242e-06, "optim/total_tokens": 1988418863104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2724143266677856, "created_at": "2025-06-03T09:35:54.256990+00:00"} {"global_step": 237039, "acc_step": 0, "speed/wps": 5519.304544604668, "speed/FLOPS": 243925010509909.72, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04866141453385353, "optim/lr": 6.959655635387918e-06, "optim/total_tokens": 1988427251712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2584805488586426, "created_at": "2025-06-03T09:35:57.229939+00:00"} {"global_step": 237040, "acc_step": 0, "speed/wps": 5505.023023643728, "speed/FLOPS": 243293840382887.1, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047813381999731064, "optim/lr": 6.9561084102933716e-06, "optim/total_tokens": 1988435640320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.252941608428955, "created_at": "2025-06-03T09:36:00.210421+00:00"} {"global_step": 237041, "acc_step": 0, "speed/wps": 5512.9886029018935, "speed/FLOPS": 243645878214567.34, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.62 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.62, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04701431840658188, "optim/lr": 6.952561185198824e-06, "optim/total_tokens": 1988444028928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2654798030853271, "created_at": "2025-06-03T09:36:03.188595+00:00"} {"global_step": 237042, "acc_step": 0, "speed/wps": 5525.208189446758, "speed/FLOPS": 244185921394336.53, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04776723310351372, "optim/lr": 6.949013960104278e-06, "optim/total_tokens": 1988452417536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2661893367767334, "created_at": "2025-06-03T09:36:06.158470+00:00"} {"global_step": 237043, "acc_step": 0, "speed/wps": 5524.578950776773, "speed/FLOPS": 244158112265858.66, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0489574633538723, "optim/lr": 6.9454667350099534e-06, "optim/total_tokens": 1988460806144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2496380805969238, "created_at": "2025-06-03T09:36:09.132003+00:00"} {"global_step": 237044, "acc_step": 0, "speed/wps": 5518.267751547878, "speed/FLOPS": 243879189563587.56, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04809156060218811, "optim/lr": 6.941919509915406e-06, "optim/total_tokens": 1988469194752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2802923917770386, "created_at": "2025-06-03T09:36:12.109858+00:00"} {"global_step": 237045, "acc_step": 0, "speed/wps": 5517.57048254432, "speed/FLOPS": 243848373842576.56, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046310245990753174, "optim/lr": 6.93837228482086e-06, "optim/total_tokens": 1988477583360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.263330101966858, "created_at": "2025-06-03T09:36:15.085367+00:00"} {"global_step": 237046, "acc_step": 0, "speed/wps": 5521.391474071806, "speed/FLOPS": 244017242110483.9, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04715801402926445, "optim/lr": 6.9348250597263126e-06, "optim/total_tokens": 1988485971968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2685381174087524, "created_at": "2025-06-03T09:36:18.062011+00:00"} {"global_step": 237047, "acc_step": 0, "speed/wps": 5505.532528543431, "speed/FLOPS": 243316357891571.47, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04676134139299393, "optim/lr": 6.931277834631988e-06, "optim/total_tokens": 1988494360576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2677385807037354, "created_at": "2025-06-03T09:36:21.042954+00:00"} {"global_step": 237048, "acc_step": 0, "speed/wps": 5515.40130492369, "speed/FLOPS": 243752507294602.28, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05049583688378334, "optim/lr": 6.927730609537442e-06, "optim/total_tokens": 1988502749184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2514541149139404, "created_at": "2025-06-03T09:36:24.018107+00:00"} {"global_step": 237049, "acc_step": 0, "speed/wps": 5512.174527471752, "speed/FLOPS": 243609900247370.88, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.058555446565151215, "optim/lr": 6.9241833844428945e-06, "optim/total_tokens": 1988511137792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.254202961921692, "created_at": "2025-06-03T09:36:26.999982+00:00"} {"global_step": 237050, "acc_step": 0, "speed/wps": 5513.137416713326, "speed/FLOPS": 243652455023334.53, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0466855950653553, "optim/lr": 6.920636159348348e-06, "optim/total_tokens": 1988519526400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2769469022750854, "created_at": "2025-06-03T09:36:29.979687+00:00"} {"global_step": 237051, "acc_step": 0, "speed/wps": 5514.513335151818, "speed/FLOPS": 243713263575726.84, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04834925755858421, "optim/lr": 6.917088934254024e-06, "optim/total_tokens": 1988527915008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2672119140625, "created_at": "2025-06-03T09:36:32.955645+00:00"} {"global_step": 237052, "acc_step": 0, "speed/wps": 5528.711478244553, "speed/FLOPS": 244340748827741.47, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048692792654037476, "optim/lr": 6.913541709159476e-06, "optim/total_tokens": 1988536303616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2492284774780273, "created_at": "2025-06-03T09:36:35.926083+00:00"} {"global_step": 237053, "acc_step": 0, "speed/wps": 5511.406652528702, "speed/FLOPS": 243575964105228.28, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04802244156599045, "optim/lr": 6.90999448406493e-06, "optim/total_tokens": 1988544692224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2628499269485474, "created_at": "2025-06-03T09:36:38.902980+00:00"} {"global_step": 237054, "acc_step": 0, "speed/wps": 5500.829490773209, "speed/FLOPS": 243108507694457.16, "speed/curr_iter_time": 2.9776, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9776, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0486152209341526, "optim/lr": 6.906447258970383e-06, "optim/total_tokens": 1988553080832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2689059972763062, "created_at": "2025-06-03T09:36:41.885937+00:00"} {"global_step": 237055, "acc_step": 0, "speed/wps": 5510.862720690372, "speed/FLOPS": 243551925102069.66, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05140795558691025, "optim/lr": 6.902900033876058e-06, "optim/total_tokens": 1988561469440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2521799802780151, "created_at": "2025-06-03T09:36:44.864083+00:00"} {"global_step": 237056, "acc_step": 0, "speed/wps": 5503.549037934363, "speed/FLOPS": 243228697759075.94, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.61 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.61, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04683976620435715, "optim/lr": 6.899352808781512e-06, "optim/total_tokens": 1988569858048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2742059230804443, "created_at": "2025-06-03T09:36:47.849292+00:00"} {"global_step": 237057, "acc_step": 0, "speed/wps": 5509.030640097697, "speed/FLOPS": 243470956517311.97, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.050123244524002075, "optim/lr": 6.895805583686965e-06, "optim/total_tokens": 1988578246656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2529237270355225, "created_at": "2025-06-03T09:36:50.827539+00:00"} {"global_step": 237058, "acc_step": 0, "speed/wps": 5518.898593540979, "speed/FLOPS": 243907069550740.6, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04963013902306557, "optim/lr": 6.89225835859264e-06, "optim/total_tokens": 1988586635264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.255528450012207, "created_at": "2025-06-03T09:36:53.806684+00:00"} {"global_step": 237059, "acc_step": 0, "speed/wps": 5519.912199764233, "speed/FLOPS": 243951865757701.47, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048510607331991196, "optim/lr": 6.888711133498094e-06, "optim/total_tokens": 1988595023872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2603530883789062, "created_at": "2025-06-03T09:36:56.780195+00:00"} {"global_step": 237060, "acc_step": 0, "speed/wps": 5523.318350237822, "speed/FLOPS": 244102400174375.53, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04739981144666672, "optim/lr": 6.8851639084035465e-06, "optim/total_tokens": 1988603412480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.260727047920227, "created_at": "2025-06-03T09:36:59.755178+00:00"} {"global_step": 237061, "acc_step": 0, "speed/wps": 5507.092758309015, "speed/FLOPS": 243385312061230.4, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04774898290634155, "optim/lr": 6.881616683309e-06, "optim/total_tokens": 1988611801088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.268187165260315, "created_at": "2025-06-03T09:37:02.738382+00:00"} {"global_step": 237062, "acc_step": 0, "speed/wps": 5504.934428890034, "speed/FLOPS": 243289924948242.88, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04649634659290314, "optim/lr": 6.878069458214676e-06, "optim/total_tokens": 1988620189696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.246809482574463, "created_at": "2025-06-03T09:37:05.722675+00:00"} {"global_step": 237063, "acc_step": 0, "speed/wps": 5520.737396931316, "speed/FLOPS": 243988335248744.5, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04686758294701576, "optim/lr": 6.874522233120128e-06, "optim/total_tokens": 1988628578304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2767280340194702, "created_at": "2025-06-03T09:37:08.694998+00:00"} {"global_step": 237064, "acc_step": 0, "speed/wps": 5516.246378306323, "speed/FLOPS": 243789855212637.0, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04780161753296852, "optim/lr": 6.870975008025582e-06, "optim/total_tokens": 1988636966912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2467020750045776, "created_at": "2025-06-03T09:37:11.674260+00:00"} {"global_step": 237065, "acc_step": 0, "speed/wps": 5508.086965021124, "speed/FLOPS": 243429250909094.38, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04853665456175804, "optim/lr": 6.867427782931035e-06, "optim/total_tokens": 1988645355520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2731972932815552, "created_at": "2025-06-03T09:37:14.655020+00:00"} {"global_step": 237066, "acc_step": 0, "speed/wps": 5517.137753020141, "speed/FLOPS": 243829249412518.34, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046708475798368454, "optim/lr": 6.86388055783671e-06, "optim/total_tokens": 1988653744128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2694144248962402, "created_at": "2025-06-03T09:37:17.632820+00:00"} {"global_step": 237067, "acc_step": 0, "speed/wps": 5514.410063159936, "speed/FLOPS": 243708699482279.66, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048145588487386703, "optim/lr": 6.860333332742164e-06, "optim/total_tokens": 1988662132736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.257074236869812, "created_at": "2025-06-03T09:37:20.608678+00:00"} {"global_step": 237068, "acc_step": 0, "speed/wps": 5521.517595476768, "speed/FLOPS": 244022816031035.34, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.049435924738645554, "optim/lr": 6.856786107647617e-06, "optim/total_tokens": 1988670521344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2585175037384033, "created_at": "2025-06-03T09:37:23.580551+00:00"} {"global_step": 237069, "acc_step": 0, "speed/wps": 5501.108312221897, "speed/FLOPS": 243120830175351.62, "speed/curr_iter_time": 2.9775, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9775, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047690778970718384, "optim/lr": 6.85323888255307e-06, "optim/total_tokens": 1988678909952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2568305730819702, "created_at": "2025-06-03T09:37:26.562832+00:00"} {"global_step": 237070, "acc_step": 0, "speed/wps": 5513.912545645943, "speed/FLOPS": 243686711754686.66, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047262560576200485, "optim/lr": 6.849691657458745e-06, "optim/total_tokens": 1988687298560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2556052207946777, "created_at": "2025-06-03T09:37:29.542175+00:00"} {"global_step": 237071, "acc_step": 0, "speed/wps": 5526.572234229713, "speed/FLOPS": 244246205191929.0, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04918839409947395, "optim/lr": 6.8461444323641986e-06, "optim/total_tokens": 1988695687168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.2715554237365723, "created_at": "2025-06-03T09:37:32.515484+00:00"} {"global_step": 237072, "acc_step": 0, "speed/wps": 5510.4536033866825, "speed/FLOPS": 243533844211298.75, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04634232074022293, "optim/lr": 6.842597207269652e-06, "optim/total_tokens": 1988704075776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2676301002502441, "created_at": "2025-06-03T09:37:35.497063+00:00"} {"global_step": 237073, "acc_step": 0, "speed/wps": 5500.512560005221, "speed/FLOPS": 243094500976710.8, "speed/curr_iter_time": 2.9778, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9778, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04763828590512276, "optim/lr": 6.839049982175105e-06, "optim/total_tokens": 1988712464384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2536916732788086, "created_at": "2025-06-03T09:37:38.483540+00:00"} {"global_step": 237074, "acc_step": 0, "speed/wps": 5501.007629088467, "speed/FLOPS": 243116380496197.03, "speed/curr_iter_time": 2.9775, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9775, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04846200719475746, "optim/lr": 6.8355027570807804e-06, "optim/total_tokens": 1988720852992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2672080993652344, "created_at": "2025-06-03T09:37:41.467905+00:00"} {"global_step": 237075, "acc_step": 0, "speed/wps": 5515.997512234611, "speed/FLOPS": 243778856606079.34, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04739657789468765, "optim/lr": 6.831955531986234e-06, "optim/total_tokens": 1988729241600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2641732692718506, "created_at": "2025-06-03T09:37:44.442554+00:00"} {"global_step": 237076, "acc_step": 0, "speed/wps": 5512.453608507662, "speed/FLOPS": 243622234200691.8, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04652881249785423, "optim/lr": 6.828408306891687e-06, "optim/total_tokens": 1988737630208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2604848146438599, "created_at": "2025-06-03T09:37:47.419241+00:00"} {"global_step": 237077, "acc_step": 0, "speed/wps": 5512.094967314765, "speed/FLOPS": 243606384095657.84, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047753989696502686, "optim/lr": 6.82486108179714e-06, "optim/total_tokens": 1988746018816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2827255725860596, "created_at": "2025-06-03T09:37:50.395575+00:00"} {"global_step": 237078, "acc_step": 0, "speed/wps": 5514.260829763735, "speed/FLOPS": 243702104130013.34, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04659899324178696, "optim/lr": 6.821313856702815e-06, "optim/total_tokens": 1988754407424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2671749591827393, "created_at": "2025-06-03T09:37:53.375614+00:00"} {"global_step": 237079, "acc_step": 0, "speed/wps": 5530.857290008531, "speed/FLOPS": 244435582724449.03, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047669410705566406, "optim/lr": 6.817766631608269e-06, "optim/total_tokens": 1988762796032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2795864343643188, "created_at": "2025-06-03T09:37:56.345251+00:00"} {"global_step": 237080, "acc_step": 0, "speed/wps": 5520.610010980781, "speed/FLOPS": 243982705441751.28, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04774890094995499, "optim/lr": 6.814219406513722e-06, "optim/total_tokens": 1988771184640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2351545095443726, "created_at": "2025-06-03T09:37:59.321645+00:00"} {"global_step": 237081, "acc_step": 0, "speed/wps": 5501.591055273984, "speed/FLOPS": 243142164947350.97, "speed/curr_iter_time": 2.9772, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9772, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047290313988924026, "optim/lr": 6.810672181419175e-06, "optim/total_tokens": 1988779573248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2604963779449463, "created_at": "2025-06-03T09:38:02.307661+00:00"} {"global_step": 237082, "acc_step": 0, "speed/wps": 5512.082931721296, "speed/FLOPS": 243605852184030.25, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04632735624909401, "optim/lr": 6.807124956324851e-06, "optim/total_tokens": 1988787961856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2516666650772095, "created_at": "2025-06-03T09:38:05.289291+00:00"} {"global_step": 237083, "acc_step": 0, "speed/wps": 5497.953253585845, "speed/FLOPS": 242981392732692.2, "speed/curr_iter_time": 2.9792, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9792, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.59 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.59, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047459203749895096, "optim/lr": 6.803577731230303e-06, "optim/total_tokens": 1988796350464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.289709448814392, "created_at": "2025-06-03T09:38:08.274371+00:00"} {"global_step": 237084, "acc_step": 0, "speed/wps": 5523.947856810752, "speed/FLOPS": 244130221142792.25, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04781036078929901, "optim/lr": 6.800030506135757e-06, "optim/total_tokens": 1988804739072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2878711223602295, "created_at": "2025-06-03T09:38:11.249015+00:00"} {"global_step": 237085, "acc_step": 0, "speed/wps": 5518.040348942404, "speed/FLOPS": 243869139532377.66, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047024115920066833, "optim/lr": 6.7964832810414325e-06, "optim/total_tokens": 1988813127680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2860196828842163, "created_at": "2025-06-03T09:38:14.223828+00:00"} {"global_step": 237086, "acc_step": 0, "speed/wps": 5521.476702748499, "speed/FLOPS": 244021008781753.78, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0466364324092865, "optim/lr": 6.792936055946885e-06, "optim/total_tokens": 1988821516288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2532833814620972, "created_at": "2025-06-03T09:38:17.196441+00:00"} {"global_step": 237087, "acc_step": 0, "speed/wps": 5510.56260037162, "speed/FLOPS": 243538661320135.84, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04734228923916817, "optim/lr": 6.789388830852339e-06, "optim/total_tokens": 1988829904896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2506645917892456, "created_at": "2025-06-03T09:38:20.173884+00:00"} {"global_step": 237088, "acc_step": 0, "speed/wps": 5511.252962238573, "speed/FLOPS": 243569171781062.8, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.049938492476940155, "optim/lr": 6.7858416057577925e-06, "optim/total_tokens": 1988838293504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2538933753967285, "created_at": "2025-06-03T09:38:23.153728+00:00"} {"global_step": 237089, "acc_step": 0, "speed/wps": 5516.122776351308, "speed/FLOPS": 243784392638877.47, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.56, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04850507900118828, "optim/lr": 6.782294380663467e-06, "optim/total_tokens": 1988846682112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2776157855987549, "created_at": "2025-06-03T09:38:26.132213+00:00"} {"global_step": 237090, "acc_step": 0, "speed/wps": 5514.910824747574, "speed/FLOPS": 243730830581323.1, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.047599583864212036, "optim/lr": 6.778747155568921e-06, "optim/total_tokens": 1988855070720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2643495798110962, "created_at": "2025-06-03T09:38:29.110559+00:00"} {"global_step": 237091, "acc_step": 0, "speed/wps": 5500.562665673337, "speed/FLOPS": 243096715390777.5, "speed/curr_iter_time": 2.9778, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9778, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.58 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.58, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04890502989292145, "optim/lr": 6.7751999304743735e-06, "optim/total_tokens": 1988863459328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2525584697723389, "created_at": "2025-06-03T09:38:32.093496+00:00"} {"global_step": 237092, "acc_step": 0, "speed/wps": 5519.912616740041, "speed/FLOPS": 243951884185897.88, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04906425252556801, "optim/lr": 6.771652705379827e-06, "optim/total_tokens": 1988871847936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2494893074035645, "created_at": "2025-06-03T09:38:35.068376+00:00"} {"global_step": 237093, "acc_step": 0, "speed/wps": 5517.008498455828, "speed/FLOPS": 243823537022360.56, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.049738071858882904, "optim/lr": 6.768105480285503e-06, "optim/total_tokens": 1988880236544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2541937828063965, "created_at": "2025-06-03T09:38:38.044025+00:00"} {"global_step": 237094, "acc_step": 0, "speed/wps": 5514.598916021485, "speed/FLOPS": 243717045812123.53, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04726605862379074, "optim/lr": 6.764558255190955e-06, "optim/total_tokens": 1988888625152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2533986568450928, "created_at": "2025-06-03T09:38:41.022727+00:00"} {"global_step": 237095, "acc_step": 0, "speed/wps": 5511.985440386057, "speed/FLOPS": 243601543566018.6, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04754822701215744, "optim/lr": 6.761011030096409e-06, "optim/total_tokens": 1988897013760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.268502116203308, "created_at": "2025-06-03T09:38:43.999852+00:00"} {"global_step": 237096, "acc_step": 0, "speed/wps": 5511.293456768685, "speed/FLOPS": 243570961432023.97, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.052588336169719696, "optim/lr": 6.757463805001863e-06, "optim/total_tokens": 1988905402368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2636950016021729, "created_at": "2025-06-03T09:38:46.980508+00:00"} {"global_step": 237097, "acc_step": 0, "speed/wps": 5508.582983294838, "speed/FLOPS": 243451172377940.84, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04936608672142029, "optim/lr": 6.753916579907537e-06, "optim/total_tokens": 1988913790976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2657670974731445, "created_at": "2025-06-03T09:38:49.960901+00:00"} {"global_step": 237098, "acc_step": 0, "speed/wps": 5512.1234496751185, "speed/FLOPS": 243607642870199.53, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04712655767798424, "optim/lr": 6.750369354812991e-06, "optim/total_tokens": 1988922179584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2560145854949951, "created_at": "2025-06-03T09:38:52.941071+00:00"} {"global_step": 237099, "acc_step": 0, "speed/wps": 5507.026894247308, "speed/FLOPS": 243382401206825.75, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.055397577583789825, "optim/lr": 6.746822129718444e-06, "optim/total_tokens": 1988930568192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2611087560653687, "created_at": "2025-06-03T09:38:55.920149+00:00"} {"global_step": 237100, "acc_step": 0, "speed/wps": 5503.744494745267, "speed/FLOPS": 243237335949679.25, "speed/curr_iter_time": 2.976, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.976, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04682197421789169, "optim/lr": 6.743274904623897e-06, "optim/total_tokens": 1988938956800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2518593072891235, "created_at": "2025-06-03T09:38:58.901425+00:00"} {"global_step": 237101, "acc_step": 0, "speed/wps": 5529.961910227777, "speed/FLOPS": 244396011521108.84, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.046428050845861435, "optim/lr": 6.739727679529573e-06, "optim/total_tokens": 1988947345408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.264165997505188, "created_at": "2025-06-03T09:39:01.868259+00:00"} {"global_step": 237102, "acc_step": 0, "speed/wps": 5515.482119556837, "speed/FLOPS": 243756078887740.6, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.049147944897413254, "optim/lr": 6.7361804544350256e-06, "optim/total_tokens": 1988955734016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.26819908618927, "created_at": "2025-06-03T09:39:04.843424+00:00"} {"global_step": 237103, "acc_step": 0, "speed/wps": 5509.13259921924, "speed/FLOPS": 243475462588610.06, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.57 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.57, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04797197878360748, "optim/lr": 6.732633229340479e-06, "optim/total_tokens": 1988964122624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2579143047332764, "created_at": "2025-06-03T09:39:07.822090+00:00"} {"global_step": 237104, "acc_step": 0, "speed/wps": 5519.25945916567, "speed/FLOPS": 243923017964274.22, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.04735341668128967, "optim/lr": 6.729086004245932e-06, "optim/total_tokens": 1988972511232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2685586214065552, "created_at": "2025-06-03T09:39:10.800292+00:00"} {"global_step": 237105, "acc_step": 0, "speed/wps": 5513.087658746752, "speed/FLOPS": 243650255975896.28, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05082174018025398, "optim/lr": 6.7255387791516074e-06, "optim/total_tokens": 1988980899840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.260918140411377, "created_at": "2025-06-03T09:39:13.780868+00:00"} {"global_step": 237106, "acc_step": 0, "speed/wps": 5516.904293889889, "speed/FLOPS": 243818931713913.38, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.05024264007806778, "optim/lr": 6.721991554057061e-06, "optim/total_tokens": 1988989288448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.254221796989441, "created_at": "2025-06-03T09:39:16.755634+00:00"} {"global_step": 237107, "acc_step": 0, "speed/wps": 5503.932309106362, "speed/FLOPS": 243245636383118.6, "speed/curr_iter_time": 2.976, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.976, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.0474424734711647, "optim/lr": 6.718444328962514e-06, "optim/total_tokens": 1988997677056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2602336406707764, "created_at": "2025-06-03T09:39:19.737189+00:00"} {"global_step": 237108, "acc_step": 0, "speed/wps": 5522.032966301333, "speed/FLOPS": 244045592783574.06, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04713146761059761, "optim/lr": 6.714897103867967e-06, "optim/total_tokens": 1989006065664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.264577031135559, "created_at": "2025-06-03T09:39:22.709060+00:00"} {"global_step": 237109, "acc_step": 0, "speed/wps": 5518.460378056978, "speed/FLOPS": 243887702669337.9, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04853292182087898, "optim/lr": 6.711349878773643e-06, "optim/total_tokens": 1989014454272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2582578659057617, "created_at": "2025-06-03T09:39:25.684353+00:00"} {"global_step": 237110, "acc_step": 0, "speed/wps": 5522.291570351207, "speed/FLOPS": 244057021758923.0, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04767156019806862, "optim/lr": 6.707802653679096e-06, "optim/total_tokens": 1989022842880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2614123821258545, "created_at": "2025-06-03T09:39:28.659370+00:00"} {"global_step": 237111, "acc_step": 0, "speed/wps": 5512.115735583506, "speed/FLOPS": 243607301946834.53, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.049651969224214554, "optim/lr": 6.704255428584549e-06, "optim/total_tokens": 1989031231488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2619959115982056, "created_at": "2025-06-03T09:39:31.638530+00:00"} {"global_step": 237112, "acc_step": 0, "speed/wps": 5525.796182979349, "speed/FLOPS": 244211907698853.3, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04940423741936684, "optim/lr": 6.700708203490225e-06, "optim/total_tokens": 1989039620096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2705103158950806, "created_at": "2025-06-03T09:39:34.609874+00:00"} {"global_step": 237113, "acc_step": 0, "speed/wps": 5524.384114389001, "speed/FLOPS": 244149501494782.2, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04731806367635727, "optim/lr": 6.697160978395678e-06, "optim/total_tokens": 1989048008704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2476762533187866, "created_at": "2025-06-03T09:39:37.580480+00:00"} {"global_step": 237114, "acc_step": 0, "speed/wps": 5526.1547211366815, "speed/FLOPS": 244227753250242.75, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04858654737472534, "optim/lr": 6.693613753301131e-06, "optim/total_tokens": 1989056397312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2553555965423584, "created_at": "2025-06-03T09:39:40.549914+00:00"} {"global_step": 237115, "acc_step": 0, "speed/wps": 5508.91077136099, "speed/FLOPS": 243465658932693.34, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.050065070390701294, "optim/lr": 6.690066528206584e-06, "optim/total_tokens": 1989064785920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2591240406036377, "created_at": "2025-06-03T09:39:43.528717+00:00"} {"global_step": 237116, "acc_step": 0, "speed/wps": 5502.882970483108, "speed/FLOPS": 243199260986972.72, "speed/curr_iter_time": 2.9765, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9765, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.56 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.56, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04728686064481735, "optim/lr": 6.6865193031122595e-06, "optim/total_tokens": 1989073174528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2556535005569458, "created_at": "2025-06-03T09:39:46.510553+00:00"} {"global_step": 237117, "acc_step": 0, "speed/wps": 5526.930173772114, "speed/FLOPS": 244262024287602.5, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.050240013748407364, "optim/lr": 6.682972078017713e-06, "optim/total_tokens": 1989081563136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2580281496047974, "created_at": "2025-06-03T09:39:49.483894+00:00"} {"global_step": 237118, "acc_step": 0, "speed/wps": 5528.056661994754, "speed/FLOPS": 244311809301153.75, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.049190204590559006, "optim/lr": 6.679424852923166e-06, "optim/total_tokens": 1989089951744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2603139877319336, "created_at": "2025-06-03T09:39:52.453953+00:00"} {"global_step": 237119, "acc_step": 0, "speed/wps": 5511.768834917672, "speed/FLOPS": 243591970713003.28, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04688799008727074, "optim/lr": 6.6758776278286195e-06, "optim/total_tokens": 1989098340352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2730271816253662, "created_at": "2025-06-03T09:39:55.432439+00:00"} {"global_step": 237120, "acc_step": 0, "speed/wps": 5528.668895605795, "speed/FLOPS": 244338866893066.06, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046505048871040344, "optim/lr": 6.672330402734295e-06, "optim/total_tokens": 1989106728960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2619298696517944, "created_at": "2025-06-03T09:39:58.401317+00:00"} {"global_step": 237121, "acc_step": 0, "speed/wps": 5518.569714528677, "speed/FLOPS": 243892534781752.22, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04895658791065216, "optim/lr": 6.668783177639748e-06, "optim/total_tokens": 1989115117568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2584091424942017, "created_at": "2025-06-03T09:40:01.374874+00:00"} {"global_step": 237122, "acc_step": 0, "speed/wps": 5521.864931460244, "speed/FLOPS": 244038166503678.25, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05086557939648628, "optim/lr": 6.665235952545201e-06, "optim/total_tokens": 1989123506176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2639962434768677, "created_at": "2025-06-03T09:40:04.348333+00:00"} {"global_step": 237123, "acc_step": 0, "speed/wps": 5520.449995894852, "speed/FLOPS": 243975633593984.66, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.049310315400362015, "optim/lr": 6.661688727450654e-06, "optim/total_tokens": 1989131894784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2629332542419434, "created_at": "2025-06-03T09:40:07.320478+00:00"} {"global_step": 237124, "acc_step": 0, "speed/wps": 5498.495894897345, "speed/FLOPS": 243005374701170.5, "speed/curr_iter_time": 2.9789, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9789, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04784274473786354, "optim/lr": 6.65814150235633e-06, "optim/total_tokens": 1989140283392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.246331810951233, "created_at": "2025-06-03T09:40:10.304468+00:00"} {"global_step": 237125, "acc_step": 0, "speed/wps": 5513.8861009268985, "speed/FLOPS": 243685543033461.22, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0481908917427063, "optim/lr": 6.654594277261783e-06, "optim/total_tokens": 1989148672000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2611392736434937, "created_at": "2025-06-03T09:40:13.284322+00:00"} {"global_step": 237126, "acc_step": 0, "speed/wps": 5516.194514996471, "speed/FLOPS": 243787563119802.03, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04732392728328705, "optim/lr": 6.651047052167236e-06, "optim/total_tokens": 1989157060608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.284773349761963, "created_at": "2025-06-03T09:40:16.259185+00:00"} {"global_step": 237127, "acc_step": 0, "speed/wps": 5519.616241637257, "speed/FLOPS": 243938785923340.12, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04718135669827461, "optim/lr": 6.64749982707269e-06, "optim/total_tokens": 1989165449216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2673101425170898, "created_at": "2025-06-03T09:40:19.236223+00:00"} {"global_step": 237128, "acc_step": 0, "speed/wps": 5515.039172764372, "speed/FLOPS": 243736502906720.84, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04759781062602997, "optim/lr": 6.643952601978364e-06, "optim/total_tokens": 1989173837824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2803517580032349, "created_at": "2025-06-03T09:40:22.216766+00:00"} {"global_step": 237129, "acc_step": 0, "speed/wps": 5511.059991305411, "speed/FLOPS": 243560643453531.84, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046865612268447876, "optim/lr": 6.640405376883818e-06, "optim/total_tokens": 1989182226432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.253179907798767, "created_at": "2025-06-03T09:40:25.194505+00:00"} {"global_step": 237130, "acc_step": 0, "speed/wps": 5503.628381712536, "speed/FLOPS": 243232204347952.9, "speed/curr_iter_time": 2.9761, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9761, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.55 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.55, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0463167279958725, "optim/lr": 6.6368581517892715e-06, "optim/total_tokens": 1989190615040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2540215253829956, "created_at": "2025-06-03T09:40:28.176335+00:00"} {"global_step": 237131, "acc_step": 0, "speed/wps": 5508.249397926168, "speed/FLOPS": 243436429612090.3, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04742920771241188, "optim/lr": 6.633310926694724e-06, "optim/total_tokens": 1989199003648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2581804990768433, "created_at": "2025-06-03T09:40:31.155850+00:00"} {"global_step": 237132, "acc_step": 0, "speed/wps": 5515.010415190482, "speed/FLOPS": 243735231969149.5, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04722116142511368, "optim/lr": 6.6297637016004e-06, "optim/total_tokens": 1989207392256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2615606784820557, "created_at": "2025-06-03T09:40:34.131634+00:00"} {"global_step": 237133, "acc_step": 0, "speed/wps": 5505.925671344725, "speed/FLOPS": 243333732791101.38, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04775356128811836, "optim/lr": 6.626216476505853e-06, "optim/total_tokens": 1989215780864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.259220004081726, "created_at": "2025-06-03T09:40:37.117787+00:00"} {"global_step": 237134, "acc_step": 0, "speed/wps": 5512.692500540328, "speed/FLOPS": 243632792005775.4, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04727239906787872, "optim/lr": 6.622669251411306e-06, "optim/total_tokens": 1989224169472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2712806463241577, "created_at": "2025-06-03T09:40:40.097279+00:00"} {"global_step": 237135, "acc_step": 0, "speed/wps": 5523.42759228777, "speed/FLOPS": 244107228113831.7, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046078167855739594, "optim/lr": 6.61912202631676e-06, "optim/total_tokens": 1989232558080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2705066204071045, "created_at": "2025-06-03T09:40:43.068106+00:00"} {"global_step": 237136, "acc_step": 0, "speed/wps": 5510.5244886732835, "speed/FLOPS": 243536976978142.75, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.049493394792079926, "optim/lr": 6.6155748012224344e-06, "optim/total_tokens": 1989240946688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2700165510177612, "created_at": "2025-06-03T09:40:46.048989+00:00"} {"global_step": 237137, "acc_step": 0, "speed/wps": 5513.119171430988, "speed/FLOPS": 243651648675243.0, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04658233001828194, "optim/lr": 6.612027576127888e-06, "optim/total_tokens": 1989249335296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2599427700042725, "created_at": "2025-06-03T09:40:49.029499+00:00"} {"global_step": 237138, "acc_step": 0, "speed/wps": 5513.274641813326, "speed/FLOPS": 243658519670372.75, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048491038382053375, "optim/lr": 6.608480351033342e-06, "optim/total_tokens": 1989257723904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2524821758270264, "created_at": "2025-06-03T09:40:52.005625+00:00"} {"global_step": 237139, "acc_step": 0, "speed/wps": 5516.613498516861, "speed/FLOPS": 243806080046851.2, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048235002905130386, "optim/lr": 6.604933125939016e-06, "optim/total_tokens": 1989266112512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2520936727523804, "created_at": "2025-06-03T09:40:54.980841+00:00"} {"global_step": 237140, "acc_step": 0, "speed/wps": 5503.4734720986835, "speed/FLOPS": 243225358135919.9, "speed/curr_iter_time": 2.9762, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9762, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.54 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.54, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04657423123717308, "optim/lr": 6.60138590084447e-06, "optim/total_tokens": 1989274501120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2631479501724243, "created_at": "2025-06-03T09:40:57.962947+00:00"} {"global_step": 237141, "acc_step": 0, "speed/wps": 5516.16108962781, "speed/FLOPS": 243786085889593.72, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05203515291213989, "optim/lr": 6.5978386757499235e-06, "optim/total_tokens": 1989282889728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2587568759918213, "created_at": "2025-06-03T09:41:00.938062+00:00"} {"global_step": 237142, "acc_step": 0, "speed/wps": 5520.634963637383, "speed/FLOPS": 243983808221453.8, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047053638845682144, "optim/lr": 6.594291450655376e-06, "optim/total_tokens": 1989291278336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.269445538520813, "created_at": "2025-06-03T09:41:03.911189+00:00"} {"global_step": 237143, "acc_step": 0, "speed/wps": 5535.050205766883, "speed/FLOPS": 244620888139679.8, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046448804438114166, "optim/lr": 6.590744225561052e-06, "optim/total_tokens": 1989299666944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2639586925506592, "created_at": "2025-06-03T09:41:06.875357+00:00"} {"global_step": 237144, "acc_step": 0, "speed/wps": 5527.685999406003, "speed/FLOPS": 244295427911954.1, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05158146098256111, "optim/lr": 6.587197000466505e-06, "optim/total_tokens": 1989308055552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2760002613067627, "created_at": "2025-06-03T09:41:09.848398+00:00"} {"global_step": 237145, "acc_step": 0, "speed/wps": 5527.940505769788, "speed/FLOPS": 244306675790551.7, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04851995408535004, "optim/lr": 6.583649775371958e-06, "optim/total_tokens": 1989316444160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.259122371673584, "created_at": "2025-06-03T09:41:12.821056+00:00"} {"global_step": 237146, "acc_step": 0, "speed/wps": 5522.131025726901, "speed/FLOPS": 244049926508270.53, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04736834764480591, "optim/lr": 6.580102550277412e-06, "optim/total_tokens": 1989324832768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2753629684448242, "created_at": "2025-06-03T09:41:15.794480+00:00"} {"global_step": 237147, "acc_step": 0, "speed/wps": 5519.103662324419, "speed/FLOPS": 243916132541331.44, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0515054352581501, "optim/lr": 6.5765553251830865e-06, "optim/total_tokens": 1989333221376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2612724304199219, "created_at": "2025-06-03T09:41:18.772851+00:00"} {"global_step": 237148, "acc_step": 0, "speed/wps": 5521.020223287914, "speed/FLOPS": 244000834726069.62, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04979335144162178, "optim/lr": 6.57300810008854e-06, "optim/total_tokens": 1989341609984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.263537883758545, "created_at": "2025-06-03T09:41:21.745591+00:00"} {"global_step": 237149, "acc_step": 0, "speed/wps": 5517.346282359607, "speed/FLOPS": 243838465341972.84, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.53 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.53, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04863373190164566, "optim/lr": 6.569460874993993e-06, "optim/total_tokens": 1989349998592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2463122606277466, "created_at": "2025-06-03T09:41:24.719256+00:00"} {"global_step": 237150, "acc_step": 0, "speed/wps": 5526.680976947904, "speed/FLOPS": 244251011063477.38, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04940292239189148, "optim/lr": 6.5659136498994465e-06, "optim/total_tokens": 1989358387200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2597142457962036, "created_at": "2025-06-03T09:41:27.688530+00:00"} {"global_step": 237151, "acc_step": 0, "speed/wps": 5524.175413970979, "speed/FLOPS": 244140278004531.2, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04823746904730797, "optim/lr": 6.562366424805122e-06, "optim/total_tokens": 1989366775808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2653931379318237, "created_at": "2025-06-03T09:41:30.662825+00:00"} {"global_step": 237152, "acc_step": 0, "speed/wps": 5525.051483101481, "speed/FLOPS": 244178995775971.03, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048116277903318405, "optim/lr": 6.558819199710575e-06, "optim/total_tokens": 1989375164416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.264870524406433, "created_at": "2025-06-03T09:41:33.632873+00:00"} {"global_step": 237153, "acc_step": 0, "speed/wps": 5521.033574068269, "speed/FLOPS": 244001424762225.84, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04800385609269142, "optim/lr": 6.555271974616028e-06, "optim/total_tokens": 1989383553024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2696503400802612, "created_at": "2025-06-03T09:41:36.605189+00:00"} {"global_step": 237154, "acc_step": 0, "speed/wps": 5532.962802314737, "speed/FLOPS": 244528635591394.38, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.01, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046960581094026566, "optim/lr": 6.551724749521482e-06, "optim/total_tokens": 1989391941632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2550886869430542, "created_at": "2025-06-03T09:41:39.571410+00:00"} {"global_step": 237155, "acc_step": 0, "speed/wps": 5520.920782126661, "speed/FLOPS": 243996439935728.25, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046804606914520264, "optim/lr": 6.548177524427157e-06, "optim/total_tokens": 1989400330240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2549774646759033, "created_at": "2025-06-03T09:41:42.545299+00:00"} {"global_step": 237156, "acc_step": 0, "speed/wps": 5514.168058930845, "speed/FLOPS": 243698004134043.78, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04699241742491722, "optim/lr": 6.54463029933261e-06, "optim/total_tokens": 1989408718848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2579057216644287, "created_at": "2025-06-03T09:41:45.522201+00:00"} {"global_step": 237157, "acc_step": 0, "speed/wps": 5522.701161834619, "speed/FLOPS": 244075123606010.53, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04887226223945618, "optim/lr": 6.541083074238063e-06, "optim/total_tokens": 1989417107456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2771492004394531, "created_at": "2025-06-03T09:41:48.493766+00:00"} {"global_step": 237158, "acc_step": 0, "speed/wps": 5505.941006327609, "speed/FLOPS": 243334410518853.3, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04710545018315315, "optim/lr": 6.537535849143517e-06, "optim/total_tokens": 1989425496064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2663326263427734, "created_at": "2025-06-03T09:41:51.473632+00:00"} {"global_step": 237159, "acc_step": 0, "speed/wps": 5510.16085221969, "speed/FLOPS": 243520906108154.0, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046765174716711044, "optim/lr": 6.533988624049192e-06, "optim/total_tokens": 1989433884672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2665013074874878, "created_at": "2025-06-03T09:41:54.453712+00:00"} {"global_step": 237160, "acc_step": 0, "speed/wps": 5524.113332814993, "speed/FLOPS": 244137534335196.75, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.52 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.52, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04819946736097336, "optim/lr": 6.530441398954645e-06, "optim/total_tokens": 1989442273280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2548140287399292, "created_at": "2025-06-03T09:41:57.428225+00:00"} {"global_step": 237161, "acc_step": 0, "speed/wps": 5529.810495496971, "speed/FLOPS": 244389319765018.1, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04769952967762947, "optim/lr": 6.5268941738600985e-06, "optim/total_tokens": 1989450661888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2527170181274414, "created_at": "2025-06-03T09:42:00.399503+00:00"} {"global_step": 237162, "acc_step": 0, "speed/wps": 5521.703101409229, "speed/FLOPS": 244031014443744.66, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04769060015678406, "optim/lr": 6.523346948765551e-06, "optim/total_tokens": 1989459050496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.247275710105896, "created_at": "2025-06-03T09:42:03.374509+00:00"} {"global_step": 237163, "acc_step": 0, "speed/wps": 5529.0963645839, "speed/FLOPS": 244357758833913.72, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047110751271247864, "optim/lr": 6.519799723671227e-06, "optim/total_tokens": 1989467439104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2745152711868286, "created_at": "2025-06-03T09:42:06.342021+00:00"} {"global_step": 237164, "acc_step": 0, "speed/wps": 5525.736531304014, "speed/FLOPS": 244209271400128.44, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04736676812171936, "optim/lr": 6.51625249857668e-06, "optim/total_tokens": 1989475827712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2744989395141602, "created_at": "2025-06-03T09:42:09.311548+00:00"} {"global_step": 237165, "acc_step": 0, "speed/wps": 5516.380676630491, "speed/FLOPS": 243795790511164.06, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0475928969681263, "optim/lr": 6.512705273482133e-06, "optim/total_tokens": 1989484216320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2724462747573853, "created_at": "2025-06-03T09:42:12.291541+00:00"} {"global_step": 237166, "acc_step": 0, "speed/wps": 5512.3230175258095, "speed/FLOPS": 243616462747719.22, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047192540019750595, "optim/lr": 6.509158048387587e-06, "optim/total_tokens": 1989492604928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2526952028274536, "created_at": "2025-06-03T09:42:15.271966+00:00"} {"global_step": 237167, "acc_step": 0, "speed/wps": 5516.7305134604085, "speed/FLOPS": 243811251508419.22, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0475514754652977, "optim/lr": 6.505610823293262e-06, "optim/total_tokens": 1989500993536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2775861024856567, "created_at": "2025-06-03T09:42:18.250110+00:00"} {"global_step": 237168, "acc_step": 0, "speed/wps": 5524.901308383001, "speed/FLOPS": 244172358822078.16, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.31, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04666389152407646, "optim/lr": 6.502063598198715e-06, "optim/total_tokens": 1989509382144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2573591470718384, "created_at": "2025-06-03T09:42:21.224212+00:00"} {"global_step": 237169, "acc_step": 0, "speed/wps": 5527.461480070392, "speed/FLOPS": 244285505306514.22, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046770915389060974, "optim/lr": 6.498516373104169e-06, "optim/total_tokens": 1989517770752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2489246129989624, "created_at": "2025-06-03T09:42:24.195958+00:00"} {"global_step": 237170, "acc_step": 0, "speed/wps": 5517.979672960877, "speed/FLOPS": 243866457964561.97, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04779161512851715, "optim/lr": 6.494969148009844e-06, "optim/total_tokens": 1989526159360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2480790615081787, "created_at": "2025-06-03T09:42:27.173816+00:00"} {"global_step": 237171, "acc_step": 0, "speed/wps": 5516.611407047809, "speed/FLOPS": 243805987614624.2, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05069592595100403, "optim/lr": 6.491421922915297e-06, "optim/total_tokens": 1989534547968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2610620260238647, "created_at": "2025-06-03T09:42:30.148350+00:00"} {"global_step": 237172, "acc_step": 0, "speed/wps": 5536.973118359428, "speed/FLOPS": 244705871033911.4, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 194.89, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04690887778997421, "optim/lr": 6.4878746978207505e-06, "optim/total_tokens": 1989542936576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2934638261795044, "created_at": "2025-06-03T09:42:33.111428+00:00"} {"global_step": 237173, "acc_step": 0, "speed/wps": 5518.605405327693, "speed/FLOPS": 243894112132386.66, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047614239156246185, "optim/lr": 6.484327472726203e-06, "optim/total_tokens": 1989551325184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2571760416030884, "created_at": "2025-06-03T09:42:36.090131+00:00"} {"global_step": 237174, "acc_step": 0, "speed/wps": 5506.250957497576, "speed/FLOPS": 243348108774091.94, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04730302467942238, "optim/lr": 6.480780247631879e-06, "optim/total_tokens": 1989559713792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.249208927154541, "created_at": "2025-06-03T09:42:39.069775+00:00"} {"global_step": 237175, "acc_step": 0, "speed/wps": 5509.294485623452, "speed/FLOPS": 243482617139066.5, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.51 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.51, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048206400126218796, "optim/lr": 6.4772330225373324e-06, "optim/total_tokens": 1989568102400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.266244649887085, "created_at": "2025-06-03T09:42:42.047570+00:00"} {"global_step": 237176, "acc_step": 0, "speed/wps": 5531.026619479996, "speed/FLOPS": 244443066220380.97, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04667995125055313, "optim/lr": 6.473685797442785e-06, "optim/total_tokens": 1989576491008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2583492994308472, "created_at": "2025-06-03T09:42:45.018535+00:00"} {"global_step": 237177, "acc_step": 0, "speed/wps": 5518.256705914633, "speed/FLOPS": 243878701403134.8, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048630569130182266, "optim/lr": 6.470138572348239e-06, "optim/total_tokens": 1989584879616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2552522420883179, "created_at": "2025-06-03T09:42:47.995633+00:00"} {"global_step": 237178, "acc_step": 0, "speed/wps": 5522.045330084424, "speed/FLOPS": 244046139199503.12, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.053099241107702255, "optim/lr": 6.466591347253914e-06, "optim/total_tokens": 1989593268224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.257622241973877, "created_at": "2025-06-03T09:42:50.966638+00:00"} {"global_step": 237179, "acc_step": 0, "speed/wps": 5524.723873015051, "speed/FLOPS": 244164517087011.28, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04725505784153938, "optim/lr": 6.463044122159367e-06, "optim/total_tokens": 1989601656832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2559102773666382, "created_at": "2025-06-03T09:42:53.939853+00:00"} {"global_step": 237180, "acc_step": 0, "speed/wps": 5527.820051556746, "speed/FLOPS": 244301352330875.8, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04941292852163315, "optim/lr": 6.459496897064821e-06, "optim/total_tokens": 1989610045440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.271036148071289, "created_at": "2025-06-03T09:42:56.907945+00:00"} {"global_step": 237181, "acc_step": 0, "speed/wps": 5514.666979151963, "speed/FLOPS": 243720053854111.97, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048740874975919724, "optim/lr": 6.4559496719702735e-06, "optim/total_tokens": 1989618434048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2602843046188354, "created_at": "2025-06-03T09:42:59.886986+00:00"} {"global_step": 237182, "acc_step": 0, "speed/wps": 5511.020896440916, "speed/FLOPS": 243558915660626.78, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0493285246193409, "optim/lr": 6.452402446875949e-06, "optim/total_tokens": 1989626822656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2720654010772705, "created_at": "2025-06-03T09:43:02.865684+00:00"} {"global_step": 237183, "acc_step": 0, "speed/wps": 5510.807265190685, "speed/FLOPS": 243549474252830.47, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.5 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.5, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.050361789762973785, "optim/lr": 6.448855221781403e-06, "optim/total_tokens": 1989635211264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2608877420425415, "created_at": "2025-06-03T09:43:05.845202+00:00"} {"global_step": 237184, "acc_step": 0, "speed/wps": 5533.440754383036, "speed/FLOPS": 244549758626432.75, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04636243358254433, "optim/lr": 6.445307996686855e-06, "optim/total_tokens": 1989643599872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.254905104637146, "created_at": "2025-06-03T09:43:08.810301+00:00"} {"global_step": 237185, "acc_step": 0, "speed/wps": 5535.235689501223, "speed/FLOPS": 244629085571345.8, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04779551550745964, "optim/lr": 6.441760771592309e-06, "optim/total_tokens": 1989651988480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2589774131774902, "created_at": "2025-06-03T09:43:11.780246+00:00"} {"global_step": 237186, "acc_step": 0, "speed/wps": 5524.8287761599295, "speed/FLOPS": 244169153269071.94, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04936334490776062, "optim/lr": 6.4382135464979845e-06, "optim/total_tokens": 1989660377088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2746241092681885, "created_at": "2025-06-03T09:43:14.753207+00:00"} {"global_step": 237187, "acc_step": 0, "speed/wps": 5526.190337389081, "speed/FLOPS": 244229327306298.3, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046878013759851456, "optim/lr": 6.434666321403437e-06, "optim/total_tokens": 1989668765696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.25336754322052, "created_at": "2025-06-03T09:43:17.722375+00:00"} {"global_step": 237188, "acc_step": 0, "speed/wps": 5525.958650103196, "speed/FLOPS": 244219087914145.25, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04776187986135483, "optim/lr": 6.431119096308891e-06, "optim/total_tokens": 1989677154304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.280991554260254, "created_at": "2025-06-03T09:43:20.691948+00:00"} {"global_step": 237189, "acc_step": 0, "speed/wps": 5521.0682159646285, "speed/FLOPS": 244002955756731.62, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047452203929424286, "optim/lr": 6.427571871214344e-06, "optim/total_tokens": 1989685542912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2557711601257324, "created_at": "2025-06-03T09:43:23.669580+00:00"} {"global_step": 237190, "acc_step": 0, "speed/wps": 5511.692823453626, "speed/FLOPS": 243588611395354.38, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046630267053842545, "optim/lr": 6.424024646120019e-06, "optim/total_tokens": 1989693931520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.283054232597351, "created_at": "2025-06-03T09:43:26.647152+00:00"} {"global_step": 237191, "acc_step": 0, "speed/wps": 5510.930462019439, "speed/FLOPS": 243554918922082.84, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04698364436626434, "optim/lr": 6.420477421025473e-06, "optim/total_tokens": 1989702320128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2696200609207153, "created_at": "2025-06-03T09:43:29.628181+00:00"} {"global_step": 237192, "acc_step": 0, "speed/wps": 5532.968775944972, "speed/FLOPS": 244528899595274.94, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047592394053936005, "optim/lr": 6.4169301959309255e-06, "optim/total_tokens": 1989710708736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2662352323532104, "created_at": "2025-06-03T09:43:32.597714+00:00"} {"global_step": 237193, "acc_step": 0, "speed/wps": 5518.618950874322, "speed/FLOPS": 243894710776215.25, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047287195920944214, "optim/lr": 6.413382970836379e-06, "optim/total_tokens": 1989719097344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2576730251312256, "created_at": "2025-06-03T09:43:35.570822+00:00"} {"global_step": 237194, "acc_step": 0, "speed/wps": 5527.928639720211, "speed/FLOPS": 244306151371896.38, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047479648143053055, "optim/lr": 6.409835745742054e-06, "optim/total_tokens": 1989727485952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2497321367263794, "created_at": "2025-06-03T09:43:38.539366+00:00"} {"global_step": 237195, "acc_step": 0, "speed/wps": 5532.88467558837, "speed/FLOPS": 244525182789977.78, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.05, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04963678866624832, "optim/lr": 6.406288520647507e-06, "optim/total_tokens": 1989735874560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2626348733901978, "created_at": "2025-06-03T09:43:41.510246+00:00"} {"global_step": 237196, "acc_step": 0, "speed/wps": 5525.297207163049, "speed/FLOPS": 244189855521762.62, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04719075560569763, "optim/lr": 6.402741295552961e-06, "optim/total_tokens": 1989744263168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2657479047775269, "created_at": "2025-06-03T09:43:44.484530+00:00"} {"global_step": 237197, "acc_step": 0, "speed/wps": 5517.349600791647, "speed/FLOPS": 243838611999683.75, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04772033914923668, "optim/lr": 6.399194070458636e-06, "optim/total_tokens": 1989752651776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2604573965072632, "created_at": "2025-06-03T09:43:47.463307+00:00"} {"global_step": 237198, "acc_step": 0, "speed/wps": 5506.003188499393, "speed/FLOPS": 243337158652568.97, "speed/curr_iter_time": 2.9747, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9747, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04796910658478737, "optim/lr": 6.395646845364089e-06, "optim/total_tokens": 1989761040384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2660868167877197, "created_at": "2025-06-03T09:43:50.446309+00:00"} {"global_step": 237199, "acc_step": 0, "speed/wps": 5512.749476179099, "speed/FLOPS": 243635310037381.3, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.49 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.49, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04707544296979904, "optim/lr": 6.392099620269543e-06, "optim/total_tokens": 1989769428992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2667347192764282, "created_at": "2025-06-03T09:43:53.422670+00:00"} {"global_step": 237200, "acc_step": 0, "speed/wps": 5523.695956575541, "speed/FLOPS": 244119088441738.22, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04766606539487839, "optim/lr": 6.388552395174996e-06, "optim/total_tokens": 1989777817600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.268747091293335, "created_at": "2025-06-03T09:43:56.394957+00:00"} {"global_step": 237201, "acc_step": 0, "speed/wps": 5534.4584840377565, "speed/FLOPS": 244594737067958.8, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.0, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.049100227653980255, "optim/lr": 6.385005170080671e-06, "optim/total_tokens": 1989786206208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2741854190826416, "created_at": "2025-06-03T09:43:59.359648+00:00"} {"global_step": 237202, "acc_step": 0, "speed/wps": 5540.901200887421, "speed/FLOPS": 244879472175899.7, "speed/curr_iter_time": 2.956, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.956, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 194.77, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04685455188155174, "optim/lr": 6.381457944986124e-06, "optim/total_tokens": 1989794594816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.26079261302948, "created_at": "2025-06-03T09:44:02.320867+00:00"} {"global_step": 237203, "acc_step": 0, "speed/wps": 5520.094262242636, "speed/FLOPS": 243959911987366.62, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05057491734623909, "optim/lr": 6.3779107198915775e-06, "optim/total_tokens": 1989802983424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2752987146377563, "created_at": "2025-06-03T09:44:05.293974+00:00"} {"global_step": 237204, "acc_step": 0, "speed/wps": 5516.140787265281, "speed/FLOPS": 243785188629086.88, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04759979993104935, "optim/lr": 6.374363494797031e-06, "optim/total_tokens": 1989811372032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2699334621429443, "created_at": "2025-06-03T09:44:08.270905+00:00"} {"global_step": 237205, "acc_step": 0, "speed/wps": 5508.831390348714, "speed/FLOPS": 243462150698259.6, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04697069525718689, "optim/lr": 6.370816269702706e-06, "optim/total_tokens": 1989819760640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.253719449043274, "created_at": "2025-06-03T09:44:11.254791+00:00"} {"global_step": 237206, "acc_step": 0, "speed/wps": 5512.24377174659, "speed/FLOPS": 243612960489894.38, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04704682528972626, "optim/lr": 6.3672690446081594e-06, "optim/total_tokens": 1989828149248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.265457034111023, "created_at": "2025-06-03T09:44:14.232963+00:00"} {"global_step": 237207, "acc_step": 0, "speed/wps": 5500.662761933113, "speed/FLOPS": 243101139133120.5, "speed/curr_iter_time": 2.9777, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9777, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04703613743185997, "optim/lr": 6.363721819513613e-06, "optim/total_tokens": 1989836537856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2605465650558472, "created_at": "2025-06-03T09:44:17.220536+00:00"} {"global_step": 237208, "acc_step": 0, "speed/wps": 5501.382717336914, "speed/FLOPS": 243132957476902.66, "speed/curr_iter_time": 2.9773, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9773, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04747112840414047, "optim/lr": 6.360174594419066e-06, "optim/total_tokens": 1989844926464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2468836307525635, "created_at": "2025-06-03T09:44:20.206150+00:00"} {"global_step": 237209, "acc_step": 0, "speed/wps": 5515.605674212479, "speed/FLOPS": 243761539371109.94, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.48 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.48, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046269893646240234, "optim/lr": 6.356627369324741e-06, "optim/total_tokens": 1989853315072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2549524307250977, "created_at": "2025-06-03T09:44:23.183220+00:00"} {"global_step": 237210, "acc_step": 0, "speed/wps": 5532.674158785948, "speed/FLOPS": 244515879024833.4, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04708833619952202, "optim/lr": 6.353080144230194e-06, "optim/total_tokens": 1989861703680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2662540674209595, "created_at": "2025-06-03T09:44:26.149996+00:00"} {"global_step": 237211, "acc_step": 0, "speed/wps": 5536.735263096003, "speed/FLOPS": 244695359048721.66, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 194.93, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04750756919384003, "optim/lr": 6.349532919135648e-06, "optim/total_tokens": 1989870092288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.254624366760254, "created_at": "2025-06-03T09:44:29.113554+00:00"} {"global_step": 237212, "acc_step": 0, "speed/wps": 5530.699221109973, "speed/FLOPS": 244428596888202.75, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.14, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04743459075689316, "optim/lr": 6.345985694041101e-06, "optim/total_tokens": 1989878480896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2526158094406128, "created_at": "2025-06-03T09:44:32.083105+00:00"} {"global_step": 237213, "acc_step": 0, "speed/wps": 5524.105398656216, "speed/FLOPS": 244137183685989.5, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04631698131561279, "optim/lr": 6.342438468946776e-06, "optim/total_tokens": 1989886869504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.268617033958435, "created_at": "2025-06-03T09:44:35.055790+00:00"} {"global_step": 237214, "acc_step": 0, "speed/wps": 5516.567552299809, "speed/FLOPS": 243804049459231.53, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046899788081645966, "optim/lr": 6.33889124385223e-06, "optim/total_tokens": 1989895258112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2595995664596558, "created_at": "2025-06-03T09:44:38.033532+00:00"} {"global_step": 237215, "acc_step": 0, "speed/wps": 5518.412612899921, "speed/FLOPS": 243885591693880.25, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04673650488257408, "optim/lr": 6.335344018757682e-06, "optim/total_tokens": 1989903646720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2568808794021606, "created_at": "2025-06-03T09:44:41.007417+00:00"} {"global_step": 237216, "acc_step": 0, "speed/wps": 5531.412810458812, "speed/FLOPS": 244460133884940.0, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0469391867518425, "optim/lr": 6.331796793663136e-06, "optim/total_tokens": 1989912035328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2662551403045654, "created_at": "2025-06-03T09:44:43.973723+00:00"} {"global_step": 237217, "acc_step": 0, "speed/wps": 5517.085038984998, "speed/FLOPS": 243826919721979.94, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04666753485798836, "optim/lr": 6.3282495685688115e-06, "optim/total_tokens": 1989920423936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2454735040664673, "created_at": "2025-06-03T09:44:46.948167+00:00"} {"global_step": 237218, "acc_step": 0, "speed/wps": 5527.91750500434, "speed/FLOPS": 244305659274447.47, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04754667356610298, "optim/lr": 6.324702343474264e-06, "optim/total_tokens": 1989928812544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2700684070587158, "created_at": "2025-06-03T09:44:49.921855+00:00"} {"global_step": 237219, "acc_step": 0, "speed/wps": 5518.005032811986, "speed/FLOPS": 243867578740177.5, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.050391167402267456, "optim/lr": 6.321155118379718e-06, "optim/total_tokens": 1989937201152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2685002088546753, "created_at": "2025-06-03T09:44:52.900897+00:00"} {"global_step": 237220, "acc_step": 0, "speed/wps": 5531.144296670437, "speed/FLOPS": 244448266949872.0, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.04, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046696580946445465, "optim/lr": 6.3176078932851715e-06, "optim/total_tokens": 1989945589760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2681288719177246, "created_at": "2025-06-03T09:44:55.870407+00:00"} {"global_step": 237221, "acc_step": 0, "speed/wps": 5539.19009181969, "speed/FLOPS": 244803849913356.16, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 194.85, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05006172135472298, "optim/lr": 6.314060668190846e-06, "optim/total_tokens": 1989953978368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2575595378875732, "created_at": "2025-06-03T09:44:58.832781+00:00"} {"global_step": 237222, "acc_step": 0, "speed/wps": 5528.33417092029, "speed/FLOPS": 244324073775242.97, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04822850972414017, "optim/lr": 6.3105134430963e-06, "optim/total_tokens": 1989962366976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2651854753494263, "created_at": "2025-06-03T09:45:01.806002+00:00"} {"global_step": 237223, "acc_step": 0, "speed/wps": 5528.283207102194, "speed/FLOPS": 244321821435339.62, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04859766364097595, "optim/lr": 6.3069662180017525e-06, "optim/total_tokens": 1989970755584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.249165415763855, "created_at": "2025-06-03T09:45:04.777807+00:00"} {"global_step": 237224, "acc_step": 0, "speed/wps": 5514.923447538611, "speed/FLOPS": 243731388444077.62, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04837938770651817, "optim/lr": 6.303418992907428e-06, "optim/total_tokens": 1989979144192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2666780948638916, "created_at": "2025-06-03T09:45:07.753574+00:00"} {"global_step": 237225, "acc_step": 0, "speed/wps": 5511.938304914782, "speed/FLOPS": 243599460419449.44, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.47 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.47, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046769384294748306, "optim/lr": 6.299871767812882e-06, "optim/total_tokens": 1989987532800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2748626470565796, "created_at": "2025-06-03T09:45:10.730340+00:00"} {"global_step": 237226, "acc_step": 0, "speed/wps": 5525.828324073547, "speed/FLOPS": 244213328170703.84, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04793478548526764, "optim/lr": 6.296324542718334e-06, "optim/total_tokens": 1989995921408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2525888681411743, "created_at": "2025-06-03T09:45:13.700459+00:00"} {"global_step": 237227, "acc_step": 0, "speed/wps": 5528.461359806164, "speed/FLOPS": 244329694872986.9, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048066142946481705, "optim/lr": 6.292777317623788e-06, "optim/total_tokens": 1990004310016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2647426128387451, "created_at": "2025-06-03T09:45:16.668222+00:00"} {"global_step": 237228, "acc_step": 0, "speed/wps": 5528.95802103754, "speed/FLOPS": 244351644757271.06, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04902603477239609, "optim/lr": 6.2892300925294635e-06, "optim/total_tokens": 1990012698624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2539247274398804, "created_at": "2025-06-03T09:45:19.639612+00:00"} {"global_step": 237229, "acc_step": 0, "speed/wps": 5519.838195566481, "speed/FLOPS": 243948595150948.62, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04705202579498291, "optim/lr": 6.285682867434916e-06, "optim/total_tokens": 1990021087232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2529878616333008, "created_at": "2025-06-03T09:45:22.612933+00:00"} {"global_step": 237230, "acc_step": 0, "speed/wps": 5528.081156101134, "speed/FLOPS": 244312891815283.56, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05147891491651535, "optim/lr": 6.28213564234037e-06, "optim/total_tokens": 1990029475840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2429944276809692, "created_at": "2025-06-03T09:45:25.584341+00:00"} {"global_step": 237231, "acc_step": 0, "speed/wps": 5525.28958804222, "speed/FLOPS": 244189518795620.16, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04844057559967041, "optim/lr": 6.278588417245823e-06, "optim/total_tokens": 1990037864448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.270005702972412, "created_at": "2025-06-03T09:45:28.555138+00:00"} {"global_step": 237232, "acc_step": 0, "speed/wps": 5517.756318250894, "speed/FLOPS": 243856586829613.78, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04712420329451561, "optim/lr": 6.275041192151498e-06, "optim/total_tokens": 1990046253056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2671951055526733, "created_at": "2025-06-03T09:45:31.530830+00:00"} {"global_step": 237233, "acc_step": 0, "speed/wps": 5518.204740319595, "speed/FLOPS": 243876404789818.12, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.049567483365535736, "optim/lr": 6.271493967056952e-06, "optim/total_tokens": 1990054641664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.249916911125183, "created_at": "2025-06-03T09:45:34.504483+00:00"} {"global_step": 237234, "acc_step": 0, "speed/wps": 5510.5888777189775, "speed/FLOPS": 243539822644389.4, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.46 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.46, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046289823949337006, "optim/lr": 6.2679467419624045e-06, "optim/total_tokens": 1990063030272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2676841020584106, "created_at": "2025-06-03T09:45:37.484881+00:00"} {"global_step": 237235, "acc_step": 0, "speed/wps": 5531.157533858014, "speed/FLOPS": 244448851965808.84, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.15, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0479857362806797, "optim/lr": 6.264399516867858e-06, "optim/total_tokens": 1990071418880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.26276695728302, "created_at": "2025-06-03T09:45:40.451785+00:00"} {"global_step": 237236, "acc_step": 0, "speed/wps": 5537.682476779914, "speed/FLOPS": 244737221045271.38, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047377459704875946, "optim/lr": 6.260852291773534e-06, "optim/total_tokens": 1990079807488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2643646001815796, "created_at": "2025-06-03T09:45:43.417847+00:00"} {"global_step": 237237, "acc_step": 0, "speed/wps": 5532.615737010874, "speed/FLOPS": 244513297081404.9, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04746589809656143, "optim/lr": 6.2573050666789864e-06, "optim/total_tokens": 1990088196096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2737553119659424, "created_at": "2025-06-03T09:45:46.385330+00:00"} {"global_step": 237238, "acc_step": 0, "speed/wps": 5527.504428368586, "speed/FLOPS": 244287403401465.03, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047319624572992325, "optim/lr": 6.25375784158444e-06, "optim/total_tokens": 1990096584704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.27000892162323, "created_at": "2025-06-03T09:45:49.356057+00:00"} {"global_step": 237239, "acc_step": 0, "speed/wps": 5530.591365600285, "speed/FLOPS": 244423830226729.06, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04710644111037254, "optim/lr": 6.250210616489893e-06, "optim/total_tokens": 1990104973312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2590805292129517, "created_at": "2025-06-03T09:45:52.325746+00:00"} {"global_step": 237240, "acc_step": 0, "speed/wps": 5524.1208389768935, "speed/FLOPS": 244137866069132.75, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04707789793610573, "optim/lr": 6.246663391395568e-06, "optim/total_tokens": 1990113361920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2597007751464844, "created_at": "2025-06-03T09:45:55.297096+00:00"} {"global_step": 237241, "acc_step": 0, "speed/wps": 5517.183433622185, "speed/FLOPS": 243831268261314.16, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04749913141131401, "optim/lr": 6.243116166301022e-06, "optim/total_tokens": 1990121750528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2766038179397583, "created_at": "2025-06-03T09:45:58.277753+00:00"} {"global_step": 237242, "acc_step": 0, "speed/wps": 5508.443093982741, "speed/FLOPS": 243444989986364.53, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04705534875392914, "optim/lr": 6.239568941206475e-06, "optim/total_tokens": 1990130139136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.272553563117981, "created_at": "2025-06-03T09:46:01.257241+00:00"} {"global_step": 237243, "acc_step": 0, "speed/wps": 5529.266250545499, "speed/FLOPS": 244365266923861.22, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.45 hours", "speed/est_time_elapsed_hrs": 195.13, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.45, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04838079586625099, "optim/lr": 6.236021716111928e-06, "optim/total_tokens": 1990138527744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2547826766967773, "created_at": "2025-06-03T09:46:04.224745+00:00"} {"global_step": 237244, "acc_step": 0, "speed/wps": 5535.639975986196, "speed/FLOPS": 244646952964655.8, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 194.99, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04791328310966492, "optim/lr": 6.232474491017604e-06, "optim/total_tokens": 1990146916352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2544585466384888, "created_at": "2025-06-03T09:46:07.192193+00:00"} {"global_step": 237245, "acc_step": 0, "speed/wps": 5527.977155574333, "speed/FLOPS": 244308295524321.88, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04742199182510376, "optim/lr": 6.228927265923057e-06, "optim/total_tokens": 1990155304960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2646220922470093, "created_at": "2025-06-03T09:46:10.163209+00:00"} {"global_step": 237246, "acc_step": 0, "speed/wps": 5525.416634703972, "speed/FLOPS": 244195133607785.8, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04751928150653839, "optim/lr": 6.22538004082851e-06, "optim/total_tokens": 1990163693568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2479416131973267, "created_at": "2025-06-03T09:46:13.134887+00:00"} {"global_step": 237247, "acc_step": 0, "speed/wps": 5520.320771005383, "speed/FLOPS": 243969922515303.1, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05201317369937897, "optim/lr": 6.221832815733963e-06, "optim/total_tokens": 1990172082176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2678439617156982, "created_at": "2025-06-03T09:46:16.110017+00:00"} {"global_step": 237248, "acc_step": 0, "speed/wps": 5527.4939088676565, "speed/FLOPS": 244286938493367.66, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04716625064611435, "optim/lr": 6.2182855906396385e-06, "optim/total_tokens": 1990180470784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2601028680801392, "created_at": "2025-06-03T09:46:19.078525+00:00"} {"global_step": 237249, "acc_step": 0, "speed/wps": 5520.235212518283, "speed/FLOPS": 243966141268101.3, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04744496941566467, "optim/lr": 6.214738365545092e-06, "optim/total_tokens": 1990188859392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2629388570785522, "created_at": "2025-06-03T09:46:22.050930+00:00"} {"global_step": 237250, "acc_step": 0, "speed/wps": 5510.248290629946, "speed/FLOPS": 243524770438336.94, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04852718487381935, "optim/lr": 6.211191140450545e-06, "optim/total_tokens": 1990197248000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 359, "loss/out": 1.2577364444732666, "created_at": "2025-06-03T09:46:25.028685+00:00"} {"global_step": 237251, "acc_step": 0, "speed/wps": 5535.4804370039, "speed/FLOPS": 244639902158232.88, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.01, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04904186353087425, "optim/lr": 6.20764391535622e-06, "optim/total_tokens": 1990205636608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2718777656555176, "created_at": "2025-06-03T09:46:27.993839+00:00"} {"global_step": 237252, "acc_step": 0, "speed/wps": 5532.7084144671535, "speed/FLOPS": 244517392950606.25, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.1, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0476880706846714, "optim/lr": 6.204096690261674e-06, "optim/total_tokens": 1990214025216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2506897449493408, "created_at": "2025-06-03T09:46:30.959412+00:00"} {"global_step": 237253, "acc_step": 0, "speed/wps": 5533.736112907766, "speed/FLOPS": 244562811961443.84, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04914379492402077, "optim/lr": 6.200549465167127e-06, "optim/total_tokens": 1990222413824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2783421277999878, "created_at": "2025-06-03T09:46:33.924158+00:00"} {"global_step": 237254, "acc_step": 0, "speed/wps": 5538.90015208846, "speed/FLOPS": 244791036061281.88, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05012828856706619, "optim/lr": 6.19700224007258e-06, "optim/total_tokens": 1990230802432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2502919435501099, "created_at": "2025-06-03T09:46:36.887047+00:00"} {"global_step": 237255, "acc_step": 0, "speed/wps": 5532.120497776545, "speed/FLOPS": 244491410042111.75, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047347292304039, "optim/lr": 6.193455014978255e-06, "optim/total_tokens": 1990239191040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2744914293289185, "created_at": "2025-06-03T09:46:39.857989+00:00"} {"global_step": 237256, "acc_step": 0, "speed/wps": 5527.986070570768, "speed/FLOPS": 244308689521533.22, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05115499719977379, "optim/lr": 6.189907789883709e-06, "optim/total_tokens": 1990247579648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2668246030807495, "created_at": "2025-06-03T09:46:42.826139+00:00"} {"global_step": 237257, "acc_step": 0, "speed/wps": 5521.885689788071, "speed/FLOPS": 244039083915517.47, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.051004648208618164, "optim/lr": 6.186360564789162e-06, "optim/total_tokens": 1990255968256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.247270107269287, "created_at": "2025-06-03T09:46:45.797718+00:00"} {"global_step": 237258, "acc_step": 0, "speed/wps": 5522.149247070188, "speed/FLOPS": 244050731798378.53, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.44 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.44, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046728625893592834, "optim/lr": 6.182813339694615e-06, "optim/total_tokens": 1990264356864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2593108415603638, "created_at": "2025-06-03T09:46:48.768916+00:00"} {"global_step": 237259, "acc_step": 0, "speed/wps": 5520.532001872083, "speed/FLOPS": 243979257838433.66, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04984560236334801, "optim/lr": 6.1792661146002905e-06, "optim/total_tokens": 1990272745472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2682946920394897, "created_at": "2025-06-03T09:46:51.744608+00:00"} {"global_step": 237260, "acc_step": 0, "speed/wps": 5536.805596755158, "speed/FLOPS": 244698467436456.0, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 194.88, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.050100695341825485, "optim/lr": 6.175718889505743e-06, "optim/total_tokens": 1990281134080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2640399932861328, "created_at": "2025-06-03T09:46:54.708229+00:00"} {"global_step": 237261, "acc_step": 0, "speed/wps": 5528.349920238727, "speed/FLOPS": 244324769814505.56, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04859704151749611, "optim/lr": 6.172171664411197e-06, "optim/total_tokens": 1990289522688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.256351113319397, "created_at": "2025-06-03T09:46:57.683327+00:00"} {"global_step": 237262, "acc_step": 0, "speed/wps": 5524.312395030392, "speed/FLOPS": 244146331866224.6, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048668041825294495, "optim/lr": 6.1686244393166505e-06, "optim/total_tokens": 1990297911296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2641090154647827, "created_at": "2025-06-03T09:47:00.655278+00:00"} {"global_step": 237263, "acc_step": 0, "speed/wps": 5523.717640520181, "speed/FLOPS": 244120046761102.8, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04821920394897461, "optim/lr": 6.165077214222325e-06, "optim/total_tokens": 1990306299904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2524423599243164, "created_at": "2025-06-03T09:47:03.626303+00:00"} {"global_step": 237264, "acc_step": 0, "speed/wps": 5536.57942294771, "speed/FLOPS": 244688471711829.28, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04666217789053917, "optim/lr": 6.161529989127779e-06, "optim/total_tokens": 1990314688512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2505651712417603, "created_at": "2025-06-03T09:47:06.590196+00:00"} {"global_step": 237265, "acc_step": 0, "speed/wps": 5526.534726732314, "speed/FLOPS": 244244547552524.75, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04728955402970314, "optim/lr": 6.157982764033232e-06, "optim/total_tokens": 1990323077120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2484773397445679, "created_at": "2025-06-03T09:47:09.563136+00:00"} {"global_step": 237266, "acc_step": 0, "speed/wps": 5513.756516527063, "speed/FLOPS": 243679816066261.56, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046639807522296906, "optim/lr": 6.154435538938685e-06, "optim/total_tokens": 1990331465728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.259230613708496, "created_at": "2025-06-03T09:47:12.543866+00:00"} {"global_step": 237267, "acc_step": 0, "speed/wps": 5510.015830958431, "speed/FLOPS": 243514496910692.47, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.050278667360544205, "optim/lr": 6.150888313844361e-06, "optim/total_tokens": 1990339854336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2589517831802368, "created_at": "2025-06-03T09:47:15.522818+00:00"} {"global_step": 237268, "acc_step": 0, "speed/wps": 5527.452083088931, "speed/FLOPS": 244285090008031.75, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.43 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.43, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04665660485625267, "optim/lr": 6.1473410887498134e-06, "optim/total_tokens": 1990348242944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2626304626464844, "created_at": "2025-06-03T09:47:18.491454+00:00"} {"global_step": 237269, "acc_step": 0, "speed/wps": 5529.374438459512, "speed/FLOPS": 244370048275904.66, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04676166549324989, "optim/lr": 6.143793863655267e-06, "optim/total_tokens": 1990356631552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.27140474319458, "created_at": "2025-06-03T09:47:21.459168+00:00"} {"global_step": 237270, "acc_step": 0, "speed/wps": 5547.432672973405, "speed/FLOPS": 245168129810995.47, "speed/curr_iter_time": 2.9515, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9515, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 194.53, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047787200659513474, "optim/lr": 6.140246638560721e-06, "optim/total_tokens": 1990365020160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2674872875213623, "created_at": "2025-06-03T09:47:24.417170+00:00"} {"global_step": 237271, "acc_step": 0, "speed/wps": 5536.609745433571, "speed/FLOPS": 244689811810499.8, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 194.98, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048633527010679245, "optim/lr": 6.136699413466395e-06, "optim/total_tokens": 1990373408768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2561367750167847, "created_at": "2025-06-03T09:47:27.381291+00:00"} {"global_step": 237272, "acc_step": 0, "speed/wps": 5538.6710693968025, "speed/FLOPS": 244780911778862.12, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 194.91, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04744506999850273, "optim/lr": 6.133152188371849e-06, "optim/total_tokens": 1990381797376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2386753559112549, "created_at": "2025-06-03T09:47:30.347854+00:00"} {"global_step": 237273, "acc_step": 0, "speed/wps": 5521.052891467861, "speed/FLOPS": 244002278492412.38, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04805336520075798, "optim/lr": 6.129604963277302e-06, "optim/total_tokens": 1990390185984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2824252843856812, "created_at": "2025-06-03T09:47:33.319994+00:00"} {"global_step": 237274, "acc_step": 0, "speed/wps": 5522.917631748199, "speed/FLOPS": 244084690468197.3, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046747058629989624, "optim/lr": 6.126057738182755e-06, "optim/total_tokens": 1990398574592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2740905284881592, "created_at": "2025-06-03T09:47:36.295069+00:00"} {"global_step": 237275, "acc_step": 0, "speed/wps": 5518.784992444762, "speed/FLOPS": 243902048963750.9, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04806544631719589, "optim/lr": 6.122510513088431e-06, "optim/total_tokens": 1990406963200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2517974376678467, "created_at": "2025-06-03T09:47:39.268528+00:00"} {"global_step": 237276, "acc_step": 0, "speed/wps": 5526.53714474934, "speed/FLOPS": 244244654416500.75, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047412000596523285, "optim/lr": 6.118963287993884e-06, "optim/total_tokens": 1990415351808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2521599531173706, "created_at": "2025-06-03T09:47:42.241572+00:00"} {"global_step": 237277, "acc_step": 0, "speed/wps": 5530.197657083625, "speed/FLOPS": 244406430325475.56, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04752393811941147, "optim/lr": 6.115416062899337e-06, "optim/total_tokens": 1990423740416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2708944082260132, "created_at": "2025-06-03T09:47:45.213802+00:00"} {"global_step": 237278, "acc_step": 0, "speed/wps": 5514.108540516613, "speed/FLOPS": 243695373724777.56, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047413405030965805, "optim/lr": 6.111868837805013e-06, "optim/total_tokens": 1990432129024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2619907855987549, "created_at": "2025-06-03T09:47:48.189249+00:00"} {"global_step": 237279, "acc_step": 0, "speed/wps": 5529.219374731991, "speed/FLOPS": 244363195252836.3, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04727810248732567, "optim/lr": 6.1083216127104655e-06, "optim/total_tokens": 1990440517632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2780388593673706, "created_at": "2025-06-03T09:47:51.162585+00:00"} {"global_step": 237280, "acc_step": 0, "speed/wps": 5520.408466335054, "speed/FLOPS": 243973798200009.16, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04696200415492058, "optim/lr": 6.104774387615919e-06, "optim/total_tokens": 1990448906240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2700377702713013, "created_at": "2025-06-03T09:47:54.136093+00:00"} {"global_step": 237281, "acc_step": 0, "speed/wps": 5538.120526475145, "speed/FLOPS": 244756580599659.0, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047332677990198135, "optim/lr": 6.101227162521372e-06, "optim/total_tokens": 1990457294848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2771846055984497, "created_at": "2025-06-03T09:47:57.099023+00:00"} {"global_step": 237282, "acc_step": 0, "speed/wps": 5508.298915097059, "speed/FLOPS": 243438618017591.84, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04748254269361496, "optim/lr": 6.097679937427047e-06, "optim/total_tokens": 1990465683456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2694288492202759, "created_at": "2025-06-03T09:48:00.080847+00:00"} {"global_step": 237283, "acc_step": 0, "speed/wps": 5514.998573033819, "speed/FLOPS": 243734708606438.7, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04752190038561821, "optim/lr": 6.094132712332501e-06, "optim/total_tokens": 1990474072064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.282175898551941, "created_at": "2025-06-03T09:48:03.056464+00:00"} {"global_step": 237284, "acc_step": 0, "speed/wps": 5513.890621056142, "speed/FLOPS": 243685742800037.66, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.42 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.42, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05243512615561485, "optim/lr": 6.090585487237954e-06, "optim/total_tokens": 1990482460672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2535865306854248, "created_at": "2025-06-03T09:48:06.032283+00:00"} {"global_step": 237285, "acc_step": 0, "speed/wps": 5529.601560434543, "speed/FLOPS": 244380085904685.38, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04693043977022171, "optim/lr": 6.087038262143407e-06, "optim/total_tokens": 1990490849280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2490333318710327, "created_at": "2025-06-03T09:48:09.004398+00:00"} {"global_step": 237286, "acc_step": 0, "speed/wps": 5537.9728146573925, "speed/FLOPS": 244750052493371.94, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05026380717754364, "optim/lr": 6.083491037049083e-06, "optim/total_tokens": 1990499237888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2505598068237305, "created_at": "2025-06-03T09:48:11.967518+00:00"} {"global_step": 237287, "acc_step": 0, "speed/wps": 5531.34358419586, "speed/FLOPS": 244457074438449.66, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.09, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.051606953144073486, "optim/lr": 6.079943811954536e-06, "optim/total_tokens": 1990507626496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2689050436019897, "created_at": "2025-06-03T09:48:14.933736+00:00"} {"global_step": 237288, "acc_step": 0, "speed/wps": 5531.4576094247195, "speed/FLOPS": 244462113769931.25, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.18, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046825021505355835, "optim/lr": 6.076396586859989e-06, "optim/total_tokens": 1990516015104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2768858671188354, "created_at": "2025-06-03T09:48:17.900256+00:00"} {"global_step": 237289, "acc_step": 0, "speed/wps": 5522.988268476714, "speed/FLOPS": 244087812250046.16, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0483102984726429, "optim/lr": 6.072849361765442e-06, "optim/total_tokens": 1990524403712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.265861988067627, "created_at": "2025-06-03T09:48:20.875208+00:00"} {"global_step": 237290, "acc_step": 0, "speed/wps": 5523.6755870038605, "speed/FLOPS": 244118188210930.88, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048150185495615005, "optim/lr": 6.0693021366711175e-06, "optim/total_tokens": 1990532792320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2526408433914185, "created_at": "2025-06-03T09:48:23.846137+00:00"} {"global_step": 237291, "acc_step": 0, "speed/wps": 5512.669820825548, "speed/FLOPS": 243631789678467.47, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048058778047561646, "optim/lr": 6.065754911576571e-06, "optim/total_tokens": 1990541180928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.255511999130249, "created_at": "2025-06-03T09:48:26.824311+00:00"} {"global_step": 237292, "acc_step": 0, "speed/wps": 5513.019165102397, "speed/FLOPS": 243647228907398.06, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05215868353843689, "optim/lr": 6.062207686482024e-06, "optim/total_tokens": 1990549569536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2626829147338867, "created_at": "2025-06-03T09:48:29.800716+00:00"} {"global_step": 237293, "acc_step": 0, "speed/wps": 5526.338147420756, "speed/FLOPS": 244235859753138.03, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04943873733282089, "optim/lr": 6.0586604613874775e-06, "optim/total_tokens": 1990557958144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2782466411590576, "created_at": "2025-06-03T09:48:32.769769+00:00"} {"global_step": 237294, "acc_step": 0, "speed/wps": 5531.693452082498, "speed/FLOPS": 244472536808252.88, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.4 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.4, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04657019302248955, "optim/lr": 6.055113236293153e-06, "optim/total_tokens": 1990566346752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2644680738449097, "created_at": "2025-06-03T09:48:35.739963+00:00"} {"global_step": 237295, "acc_step": 0, "speed/wps": 5533.479232026133, "speed/FLOPS": 244551459141311.22, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.4 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.4, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.052754390984773636, "optim/lr": 6.051566011198606e-06, "optim/total_tokens": 1990574735360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2643085718154907, "created_at": "2025-06-03T09:48:38.709007+00:00"} {"global_step": 237296, "acc_step": 0, "speed/wps": 5534.7152185986615, "speed/FLOPS": 244606083421464.2, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.4 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.4, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04947572574019432, "optim/lr": 6.048018786104059e-06, "optim/total_tokens": 1990583123968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.272140383720398, "created_at": "2025-06-03T09:48:41.674450+00:00"} {"global_step": 237297, "acc_step": 0, "speed/wps": 5498.165562895519, "speed/FLOPS": 242990775717482.22, "speed/curr_iter_time": 2.9777, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9777, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046844128519296646, "optim/lr": 6.044471561009512e-06, "optim/total_tokens": 1990591512576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2582106590270996, "created_at": "2025-06-03T09:48:44.663398+00:00"} {"global_step": 237298, "acc_step": 0, "speed/wps": 5511.536061313472, "speed/FLOPS": 243581683311140.9, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.41 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.41, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048314791172742844, "optim/lr": 6.040924335915188e-06, "optim/total_tokens": 1990599901184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2509000301361084, "created_at": "2025-06-03T09:48:47.641314+00:00"} {"global_step": 237299, "acc_step": 0, "speed/wps": 5515.2320451014075, "speed/FLOPS": 243745026876807.72, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.4 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.4, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04937201738357544, "optim/lr": 6.037377110820641e-06, "optim/total_tokens": 1990608289792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.273608922958374, "created_at": "2025-06-03T09:48:50.616305+00:00"} {"global_step": 237300, "acc_step": 0, "speed/wps": 5514.757136906587, "speed/FLOPS": 243724038365397.16, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.4 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.4, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048235274851322174, "optim/lr": 6.033829885726094e-06, "optim/total_tokens": 1990616678400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2526090145111084, "created_at": "2025-06-03T09:48:53.593193+00:00"} {"global_step": 237301, "acc_step": 0, "speed/wps": 5513.797003356048, "speed/FLOPS": 243681605376872.3, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.4 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.4, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048121239989995956, "optim/lr": 6.030282660631548e-06, "optim/total_tokens": 1990625067008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2406617403030396, "created_at": "2025-06-03T09:48:56.569569+00:00"} {"global_step": 237302, "acc_step": 0, "speed/wps": 5538.580238767947, "speed/FLOPS": 244776897529980.0, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 194.94, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04721459373831749, "optim/lr": 6.026735435537223e-06, "optim/total_tokens": 1990633455616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2604548931121826, "created_at": "2025-06-03T09:48:59.533265+00:00"} {"global_step": 237303, "acc_step": 0, "speed/wps": 5540.844294104424, "speed/FLOPS": 244876957187366.56, "speed/curr_iter_time": 2.9561, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9561, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04637822508811951, "optim/lr": 6.023188210442676e-06, "optim/total_tokens": 1990641844224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.253595232963562, "created_at": "2025-06-03T09:49:02.496663+00:00"} {"global_step": 237304, "acc_step": 0, "speed/wps": 5538.196322344171, "speed/FLOPS": 244759930389111.5, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047418441623449326, "optim/lr": 6.0196409853481295e-06, "optim/total_tokens": 1990650232832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2719171047210693, "created_at": "2025-06-03T09:49:05.462494+00:00"} {"global_step": 237305, "acc_step": 0, "speed/wps": 5528.267068589199, "speed/FLOPS": 244321108195669.62, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047851815819740295, "optim/lr": 6.016093760253804e-06, "optim/total_tokens": 1990658621440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2612955570220947, "created_at": "2025-06-03T09:49:08.435934+00:00"} {"global_step": 237306, "acc_step": 0, "speed/wps": 5528.797274923487, "speed/FLOPS": 244344540601803.12, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.28, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04788823425769806, "optim/lr": 6.012546535159258e-06, "optim/total_tokens": 1990667010048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2650216817855835, "created_at": "2025-06-03T09:49:11.408775+00:00"} {"global_step": 237307, "acc_step": 0, "speed/wps": 5528.297977188, "speed/FLOPS": 244322474197532.1, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047662489116191864, "optim/lr": 6.0089993100647114e-06, "optim/total_tokens": 1990675398656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2654016017913818, "created_at": "2025-06-03T09:49:14.376677+00:00"} {"global_step": 237308, "acc_step": 0, "speed/wps": 5526.435621539511, "speed/FLOPS": 244240167610269.22, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047890856862068176, "optim/lr": 6.005452084970164e-06, "optim/total_tokens": 1990683787264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2626138925552368, "created_at": "2025-06-03T09:49:17.349053+00:00"} {"global_step": 237309, "acc_step": 0, "speed/wps": 5513.492363981624, "speed/FLOPS": 243668141875808.47, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.4 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.4, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04689627140760422, "optim/lr": 6.00190485987584e-06, "optim/total_tokens": 1990692175872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2613229751586914, "created_at": "2025-06-03T09:49:20.329689+00:00"} {"global_step": 237310, "acc_step": 0, "speed/wps": 5526.889997391828, "speed/FLOPS": 244260248697235.2, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04746096581220627, "optim/lr": 5.998357634781293e-06, "optim/total_tokens": 1990700564480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2766855955123901, "created_at": "2025-06-03T09:49:23.303031+00:00"} {"global_step": 237311, "acc_step": 0, "speed/wps": 5540.635983706326, "speed/FLOPS": 244867750933999.94, "speed/curr_iter_time": 2.9549, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9549, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 194.79, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0477789007127285, "optim/lr": 5.994810409686746e-06, "optim/total_tokens": 1990708953088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.248668909072876, "created_at": "2025-06-03T09:49:26.265549+00:00"} {"global_step": 237312, "acc_step": 0, "speed/wps": 5546.991935584895, "speed/FLOPS": 245148651474321.78, "speed/curr_iter_time": 2.9528, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9528, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 194.65, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04651692509651184, "optim/lr": 5.9912631845922e-06, "optim/total_tokens": 1990717341696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2700679302215576, "created_at": "2025-06-03T09:49:29.223532+00:00"} {"global_step": 237313, "acc_step": 0, "speed/wps": 5521.733343489298, "speed/FLOPS": 244032350988890.72, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04676593840122223, "optim/lr": 5.987715959497874e-06, "optim/total_tokens": 1990725730304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2432749271392822, "created_at": "2025-06-03T09:49:32.195486+00:00"} {"global_step": 237314, "acc_step": 0, "speed/wps": 5524.398655037382, "speed/FLOPS": 244150144117014.8, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04715941473841667, "optim/lr": 5.984168734403328e-06, "optim/total_tokens": 1990734118912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2567148208618164, "created_at": "2025-06-03T09:49:35.167320+00:00"} {"global_step": 237315, "acc_step": 0, "speed/wps": 5525.930732343012, "speed/FLOPS": 244217854092041.16, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04695005714893341, "optim/lr": 5.980621509308782e-06, "optim/total_tokens": 1990742507520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2548165321350098, "created_at": "2025-06-03T09:49:38.137162+00:00"} {"global_step": 237316, "acc_step": 0, "speed/wps": 5517.1807581863495, "speed/FLOPS": 243831150020744.38, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04872702434659004, "optim/lr": 5.977074284214234e-06, "optim/total_tokens": 1990750896128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2501235008239746, "created_at": "2025-06-03T09:49:41.111304+00:00"} {"global_step": 237317, "acc_step": 0, "speed/wps": 5521.2152838245365, "speed/FLOPS": 244009455403378.0, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04724651202559471, "optim/lr": 5.97352705911991e-06, "optim/total_tokens": 1990759284736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.271998643875122, "created_at": "2025-06-03T09:49:44.083402+00:00"} {"global_step": 237318, "acc_step": 0, "speed/wps": 5516.403766577247, "speed/FLOPS": 243796810968625.62, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047562144696712494, "optim/lr": 5.969979834025363e-06, "optim/total_tokens": 1990767673344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2636622190475464, "created_at": "2025-06-03T09:49:47.063790+00:00"} {"global_step": 237319, "acc_step": 0, "speed/wps": 5510.112593360052, "speed/FLOPS": 243518773313569.25, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.39 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.39, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04690276458859444, "optim/lr": 5.966432608930816e-06, "optim/total_tokens": 1990776061952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2520722150802612, "created_at": "2025-06-03T09:49:50.045581+00:00"} {"global_step": 237320, "acc_step": 0, "speed/wps": 5521.4734374044565, "speed/FLOPS": 244020864470260.66, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.56, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04695618897676468, "optim/lr": 5.96288538383627e-06, "optim/total_tokens": 1990784450560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2483575344085693, "created_at": "2025-06-03T09:49:53.021157+00:00"} {"global_step": 237321, "acc_step": 0, "speed/wps": 5522.751125126483, "speed/FLOPS": 244077331727775.62, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046827539801597595, "optim/lr": 5.9593381587419445e-06, "optim/total_tokens": 1990792839168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2528971433639526, "created_at": "2025-06-03T09:49:55.995897+00:00"} {"global_step": 237322, "acc_step": 0, "speed/wps": 5526.2699061260255, "speed/FLOPS": 244232843837201.53, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04674364998936653, "optim/lr": 5.955790933647398e-06, "optim/total_tokens": 1990801227776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2614177465438843, "created_at": "2025-06-03T09:49:58.965321+00:00"} {"global_step": 237323, "acc_step": 0, "speed/wps": 5525.200147590411, "speed/FLOPS": 244185565985447.9, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04680430516600609, "optim/lr": 5.952243708552852e-06, "optim/total_tokens": 1990809616384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2452481985092163, "created_at": "2025-06-03T09:50:01.935915+00:00"} {"global_step": 237324, "acc_step": 0, "speed/wps": 5529.4024166615, "speed/FLOPS": 244371284769227.1, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0470539852976799, "optim/lr": 5.9486964834583045e-06, "optim/total_tokens": 1990818004992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2596240043640137, "created_at": "2025-06-03T09:50:04.906526+00:00"} {"global_step": 237325, "acc_step": 0, "speed/wps": 5519.80650730506, "speed/FLOPS": 243947194691989.06, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04809272289276123, "optim/lr": 5.94514925836398e-06, "optim/total_tokens": 1990826393600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2556360960006714, "created_at": "2025-06-03T09:50:07.879089+00:00"} {"global_step": 237326, "acc_step": 0, "speed/wps": 5515.485840381947, "speed/FLOPS": 243756243329165.56, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047153323888778687, "optim/lr": 5.941602033269433e-06, "optim/total_tokens": 1990834782208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2656738758087158, "created_at": "2025-06-03T09:50:10.853770+00:00"} {"global_step": 237327, "acc_step": 0, "speed/wps": 5521.672043374367, "speed/FLOPS": 244029641837573.2, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04766124486923218, "optim/lr": 5.938054808174886e-06, "optim/total_tokens": 1990843170816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.266420841217041, "created_at": "2025-06-03T09:50:13.831908+00:00"} {"global_step": 237328, "acc_step": 0, "speed/wps": 5529.171772008491, "speed/FLOPS": 244361091456110.44, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04789155721664429, "optim/lr": 5.93450758308034e-06, "optim/total_tokens": 1990851559424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2702096700668335, "created_at": "2025-06-03T09:50:16.799704+00:00"} {"global_step": 237329, "acc_step": 0, "speed/wps": 5505.4850088854, "speed/FLOPS": 243314257765914.16, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.38 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.38, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04704954847693443, "optim/lr": 5.930960357986015e-06, "optim/total_tokens": 1990859948032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.259650707244873, "created_at": "2025-06-03T09:50:19.780434+00:00"} {"global_step": 237330, "acc_step": 0, "speed/wps": 5527.89181512219, "speed/FLOPS": 244304523913149.2, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05006512254476547, "optim/lr": 5.927413132891468e-06, "optim/total_tokens": 1990868336640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2648042440414429, "created_at": "2025-06-03T09:50:22.752730+00:00"} {"global_step": 237331, "acc_step": 0, "speed/wps": 5527.286947957625, "speed/FLOPS": 244277791880466.22, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04765012115240097, "optim/lr": 5.923865907796922e-06, "optim/total_tokens": 1990876725248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2464559078216553, "created_at": "2025-06-03T09:50:25.723343+00:00"} {"global_step": 237332, "acc_step": 0, "speed/wps": 5525.2799489864265, "speed/FLOPS": 244189092798691.25, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047539081424474716, "optim/lr": 5.9203186827025966e-06, "optim/total_tokens": 1990885113856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2650636434555054, "created_at": "2025-06-03T09:50:28.694266+00:00"} {"global_step": 237333, "acc_step": 0, "speed/wps": 5518.048152320003, "speed/FLOPS": 243869484401726.22, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.051291514188051224, "optim/lr": 5.91677145760805e-06, "optim/total_tokens": 1990893502464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2659542560577393, "created_at": "2025-06-03T09:50:31.668275+00:00"} {"global_step": 237334, "acc_step": 0, "speed/wps": 5511.930753677631, "speed/FLOPS": 243599126693418.12, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05663566663861275, "optim/lr": 5.913224232513503e-06, "optim/total_tokens": 1990901891072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2826166152954102, "created_at": "2025-06-03T09:50:34.652026+00:00"} {"global_step": 237335, "acc_step": 0, "speed/wps": 5513.640186303653, "speed/FLOPS": 243674674865818.9, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04645712301135063, "optim/lr": 5.9096770074189565e-06, "optim/total_tokens": 1990910279680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2542768716812134, "created_at": "2025-06-03T09:50:37.630381+00:00"} {"global_step": 237336, "acc_step": 0, "speed/wps": 5524.539134731696, "speed/FLOPS": 244156352600463.25, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04752640798687935, "optim/lr": 5.906129782324632e-06, "optim/total_tokens": 1990918668288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2619237899780273, "created_at": "2025-06-03T09:50:40.604222+00:00"} {"global_step": 237337, "acc_step": 0, "speed/wps": 5531.527323801817, "speed/FLOPS": 244465194788568.44, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04845438152551651, "optim/lr": 5.902582557230085e-06, "optim/total_tokens": 1990927056896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2654200792312622, "created_at": "2025-06-03T09:50:43.571475+00:00"} {"global_step": 237338, "acc_step": 0, "speed/wps": 5522.67383697057, "speed/FLOPS": 244073915986880.9, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04753216356039047, "optim/lr": 5.8990353321355384e-06, "optim/total_tokens": 1990935445504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2691774368286133, "created_at": "2025-06-03T09:50:46.543377+00:00"} {"global_step": 237339, "acc_step": 0, "speed/wps": 5524.43250645949, "speed/FLOPS": 244151640176604.7, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04793296754360199, "optim/lr": 5.895488107040991e-06, "optim/total_tokens": 1990943834112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2604197263717651, "created_at": "2025-06-03T09:50:49.517550+00:00"} {"global_step": 237340, "acc_step": 0, "speed/wps": 5532.827290382504, "speed/FLOPS": 244522646657602.62, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04717595502734184, "optim/lr": 5.891940881946667e-06, "optim/total_tokens": 1990952222720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2490555047988892, "created_at": "2025-06-03T09:50:52.483307+00:00"} {"global_step": 237341, "acc_step": 0, "speed/wps": 5513.746958711755, "speed/FLOPS": 243679393659746.28, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0471465140581131, "optim/lr": 5.88839365685212e-06, "optim/total_tokens": 1990960611328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2545766830444336, "created_at": "2025-06-03T09:50:55.459805+00:00"} {"global_step": 237342, "acc_step": 0, "speed/wps": 5520.972827044709, "speed/FLOPS": 243998740054715.94, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04871070757508278, "optim/lr": 5.884846431757573e-06, "optim/total_tokens": 1990968999936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2604562044143677, "created_at": "2025-06-03T09:50:58.434860+00:00"} {"global_step": 237343, "acc_step": 0, "speed/wps": 5514.005970677546, "speed/FLOPS": 243690840662890.84, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.37 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.37, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04732231795787811, "optim/lr": 5.881299206663027e-06, "optim/total_tokens": 1990977388544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2672845125198364, "created_at": "2025-06-03T09:51:01.410723+00:00"} {"global_step": 237344, "acc_step": 0, "speed/wps": 5519.168893546338, "speed/FLOPS": 243919015427456.6, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04652616009116173, "optim/lr": 5.877751981568702e-06, "optim/total_tokens": 1990985777152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2599045038223267, "created_at": "2025-06-03T09:51:04.384259+00:00"} {"global_step": 237345, "acc_step": 0, "speed/wps": 5528.311392722772, "speed/FLOPS": 244323067095502.1, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04739804193377495, "optim/lr": 5.874204756474155e-06, "optim/total_tokens": 1990994165760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2655872106552124, "created_at": "2025-06-03T09:51:07.352455+00:00"} {"global_step": 237346, "acc_step": 0, "speed/wps": 5520.62942763026, "speed/FLOPS": 243983563558274.8, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04676913842558861, "optim/lr": 5.870657531379609e-06, "optim/total_tokens": 1991002554368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.255753517150879, "created_at": "2025-06-03T09:51:10.328556+00:00"} {"global_step": 237347, "acc_step": 0, "speed/wps": 5530.888681426183, "speed/FLOPS": 244436970064433.4, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0470597967505455, "optim/lr": 5.867110306285061e-06, "optim/total_tokens": 1991010942976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.262013554573059, "created_at": "2025-06-03T09:51:13.296652+00:00"} {"global_step": 237348, "acc_step": 0, "speed/wps": 5525.589425544466, "speed/FLOPS": 244202770078512.0, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046765055507421494, "optim/lr": 5.863563081190737e-06, "optim/total_tokens": 1991019331584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2544279098510742, "created_at": "2025-06-03T09:51:16.266188+00:00"} {"global_step": 237349, "acc_step": 0, "speed/wps": 5520.567296218608, "speed/FLOPS": 243980817667897.22, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04883617162704468, "optim/lr": 5.8600158560961905e-06, "optim/total_tokens": 1991027720192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2673066854476929, "created_at": "2025-06-03T09:51:19.238453+00:00"} {"global_step": 237350, "acc_step": 0, "speed/wps": 5500.462902398653, "speed/FLOPS": 243092306364671.2, "speed/curr_iter_time": 2.9778, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9778, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04676060751080513, "optim/lr": 5.856468631001643e-06, "optim/total_tokens": 1991036108800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.285020112991333, "created_at": "2025-06-03T09:51:22.221281+00:00"} {"global_step": 237351, "acc_step": 0, "speed/wps": 5518.194785843802, "speed/FLOPS": 243875964852939.7, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04639497771859169, "optim/lr": 5.852921405907097e-06, "optim/total_tokens": 1991044497408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2729322910308838, "created_at": "2025-06-03T09:51:25.194505+00:00"} {"global_step": 237352, "acc_step": 0, "speed/wps": 5528.039496446605, "speed/FLOPS": 244311050671786.8, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047655463218688965, "optim/lr": 5.849374180812772e-06, "optim/total_tokens": 1991052886016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2687479257583618, "created_at": "2025-06-03T09:51:28.164017+00:00"} {"global_step": 237353, "acc_step": 0, "speed/wps": 5528.180021526985, "speed/FLOPS": 244317261161067.03, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0481722429394722, "optim/lr": 5.845826955718225e-06, "optim/total_tokens": 1991061274624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2723253965377808, "created_at": "2025-06-03T09:51:31.133137+00:00"} {"global_step": 237354, "acc_step": 0, "speed/wps": 5526.775034842283, "speed/FLOPS": 244255167940976.97, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05107775330543518, "optim/lr": 5.842279730623679e-06, "optim/total_tokens": 1991069663232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.252359390258789, "created_at": "2025-06-03T09:51:34.105439+00:00"} {"global_step": 237355, "acc_step": 0, "speed/wps": 5526.738290722443, "speed/FLOPS": 244253544038953.5, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04710109531879425, "optim/lr": 5.8387325055291315e-06, "optim/total_tokens": 1991078051840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2736763954162598, "created_at": "2025-06-03T09:51:37.074019+00:00"} {"global_step": 237356, "acc_step": 0, "speed/wps": 5523.056442186417, "speed/FLOPS": 244090825179070.34, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04772799834609032, "optim/lr": 5.835185280434807e-06, "optim/total_tokens": 1991086440448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2528151273727417, "created_at": "2025-06-03T09:51:40.044543+00:00"} {"global_step": 237357, "acc_step": 0, "speed/wps": 5517.0931705650855, "speed/FLOPS": 243827279096198.6, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0501522570848465, "optim/lr": 5.831638055340261e-06, "optim/total_tokens": 1991094829056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.253867268562317, "created_at": "2025-06-03T09:51:43.021908+00:00"} {"global_step": 237358, "acc_step": 0, "speed/wps": 5514.202648428634, "speed/FLOPS": 243699532812800.94, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047823768109083176, "optim/lr": 5.828090830245713e-06, "optim/total_tokens": 1991103217664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2517184019088745, "created_at": "2025-06-03T09:51:45.997756+00:00"} {"global_step": 237359, "acc_step": 0, "speed/wps": 5509.822570885172, "speed/FLOPS": 243505955804649.16, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.36 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.36, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047205761075019836, "optim/lr": 5.824543605151389e-06, "optim/total_tokens": 1991111606272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2622404098510742, "created_at": "2025-06-03T09:51:48.980199+00:00"} {"global_step": 237360, "acc_step": 0, "speed/wps": 5512.437257847282, "speed/FLOPS": 243621511585193.3, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047112490981817245, "optim/lr": 5.8209963800568425e-06, "optim/total_tokens": 1991119994880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2670847177505493, "created_at": "2025-06-03T09:51:51.957153+00:00"} {"global_step": 237361, "acc_step": 0, "speed/wps": 5508.997343326105, "speed/FLOPS": 243469484970435.9, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04774956777691841, "optim/lr": 5.817449154962295e-06, "optim/total_tokens": 1991128383488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2449601888656616, "created_at": "2025-06-03T09:51:54.940183+00:00"} {"global_step": 237362, "acc_step": 0, "speed/wps": 5518.419932636315, "speed/FLOPS": 243885915188763.03, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04892483353614807, "optim/lr": 5.813901929867749e-06, "optim/total_tokens": 1991136772096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2747457027435303, "created_at": "2025-06-03T09:51:57.918807+00:00"} {"global_step": 237363, "acc_step": 0, "speed/wps": 5522.20949172244, "speed/FLOPS": 244053394303648.03, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.0473901741206646, "optim/lr": 5.8103547047734236e-06, "optim/total_tokens": 1991145160704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2728137969970703, "created_at": "2025-06-03T09:52:00.890284+00:00"} {"global_step": 237364, "acc_step": 0, "speed/wps": 5523.711230709343, "speed/FLOPS": 244119763480272.2, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04887528344988823, "optim/lr": 5.806807479678877e-06, "optim/total_tokens": 1991153549312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.255635380744934, "created_at": "2025-06-03T09:52:03.864056+00:00"} {"global_step": 237365, "acc_step": 0, "speed/wps": 5521.803910930957, "speed/FLOPS": 244035469708615.12, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04592649266123772, "optim/lr": 5.803260254584331e-06, "optim/total_tokens": 1991161937920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2560762166976929, "created_at": "2025-06-03T09:52:06.840883+00:00"} {"global_step": 237366, "acc_step": 0, "speed/wps": 5514.719580001117, "speed/FLOPS": 243722378542409.03, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04677961394190788, "optim/lr": 5.7997130294897835e-06, "optim/total_tokens": 1991170326528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2499470710754395, "created_at": "2025-06-03T09:52:09.820960+00:00"} {"global_step": 237367, "acc_step": 0, "speed/wps": 5516.691204030305, "speed/FLOPS": 243809514232812.53, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047141820192337036, "optim/lr": 5.796165804395459e-06, "optim/total_tokens": 1991178715136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2661877870559692, "created_at": "2025-06-03T09:52:12.796276+00:00"} {"global_step": 237368, "acc_step": 0, "speed/wps": 5507.872352337696, "speed/FLOPS": 243419766126974.12, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046876080334186554, "optim/lr": 5.792618579300913e-06, "optim/total_tokens": 1991187103744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.251482367515564, "created_at": "2025-06-03T09:52:15.778603+00:00"} {"global_step": 237369, "acc_step": 0, "speed/wps": 5506.340299535599, "speed/FLOPS": 243352057234878.56, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.35 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.35, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04698449373245239, "optim/lr": 5.7890713542063654e-06, "optim/total_tokens": 1991195492352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2671780586242676, "created_at": "2025-06-03T09:52:18.758680+00:00"} {"global_step": 237370, "acc_step": 0, "speed/wps": 5532.943272710277, "speed/FLOPS": 244527772482838.8, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047850195318460464, "optim/lr": 5.785524129111819e-06, "optim/total_tokens": 1991203880960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.280099868774414, "created_at": "2025-06-03T09:52:21.726098+00:00"} {"global_step": 237371, "acc_step": 0, "speed/wps": 5540.898995413131, "speed/FLOPS": 244879374705224.75, "speed/curr_iter_time": 2.9547, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9547, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 194.82, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046500373631715775, "optim/lr": 5.781976904017494e-06, "optim/total_tokens": 1991212269568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2575503587722778, "created_at": "2025-06-03T09:52:24.687611+00:00"} {"global_step": 237372, "acc_step": 0, "speed/wps": 5507.562935461847, "speed/FLOPS": 243406091484800.72, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047697875648736954, "optim/lr": 5.778429678922947e-06, "optim/total_tokens": 1991220658176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2695813179016113, "created_at": "2025-06-03T09:52:27.673421+00:00"} {"global_step": 237373, "acc_step": 0, "speed/wps": 5508.551531933077, "speed/FLOPS": 243449782388733.66, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047448884695768356, "optim/lr": 5.774882453828401e-06, "optim/total_tokens": 1991229046784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2699987888336182, "created_at": "2025-06-03T09:52:30.654992+00:00"} {"global_step": 237374, "acc_step": 0, "speed/wps": 5517.795416577947, "speed/FLOPS": 243858314775546.16, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04698294773697853, "optim/lr": 5.771335228733854e-06, "optim/total_tokens": 1991237435392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2601410150527954, "created_at": "2025-06-03T09:52:33.630377+00:00"} {"global_step": 237375, "acc_step": 0, "speed/wps": 5509.962017293101, "speed/FLOPS": 243512118622128.2, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04774807393550873, "optim/lr": 5.767788003639529e-06, "optim/total_tokens": 1991245824000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.255346417427063, "created_at": "2025-06-03T09:52:36.608927+00:00"} {"global_step": 237376, "acc_step": 0, "speed/wps": 5511.916180582395, "speed/FLOPS": 243598482637200.53, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048364099115133286, "optim/lr": 5.764240778544983e-06, "optim/total_tokens": 1991254212608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2743945121765137, "created_at": "2025-06-03T09:52:39.586028+00:00"} {"global_step": 237377, "acc_step": 0, "speed/wps": 5515.131605933505, "speed/FLOPS": 243740587979680.7, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.047614481300115585, "optim/lr": 5.760693553450436e-06, "optim/total_tokens": 1991262601216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2580252885818481, "created_at": "2025-06-03T09:52:42.565789+00:00"} {"global_step": 237378, "acc_step": 0, "speed/wps": 5524.39455136348, "speed/FLOPS": 244149962755632.88, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04647916182875633, "optim/lr": 5.757146328355889e-06, "optim/total_tokens": 1991270989824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2577217817306519, "created_at": "2025-06-03T09:52:45.538792+00:00"} {"global_step": 237379, "acc_step": 0, "speed/wps": 5521.21525393366, "speed/FLOPS": 244009454082354.28, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04817957431077957, "optim/lr": 5.753599103261564e-06, "optim/total_tokens": 1991279378432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2619811296463013, "created_at": "2025-06-03T09:52:48.510433+00:00"} {"global_step": 237380, "acc_step": 0, "speed/wps": 5515.883314108999, "speed/FLOPS": 243773809633446.28, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04731157422065735, "optim/lr": 5.7500518781670175e-06, "optim/total_tokens": 1991287767040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2577444314956665, "created_at": "2025-06-03T09:52:51.486469+00:00"} {"global_step": 237381, "acc_step": 0, "speed/wps": 5517.216550412075, "speed/FLOPS": 243832731853920.22, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04830247908830643, "optim/lr": 5.746504653072471e-06, "optim/total_tokens": 1991296155648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.270184874534607, "created_at": "2025-06-03T09:52:54.460800+00:00"} {"global_step": 237382, "acc_step": 0, "speed/wps": 5514.120191324917, "speed/FLOPS": 243695888630870.38, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.34 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.34, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046760931611061096, "optim/lr": 5.742957427977924e-06, "optim/total_tokens": 1991304544256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2683660984039307, "created_at": "2025-06-03T09:52:57.439532+00:00"} {"global_step": 237383, "acc_step": 0, "speed/wps": 5512.236512860078, "speed/FLOPS": 243612639684264.88, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05108420550823212, "optim/lr": 5.739410202883599e-06, "optim/total_tokens": 1991312932864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.269650936126709, "created_at": "2025-06-03T09:53:00.417523+00:00"} {"global_step": 237384, "acc_step": 0, "speed/wps": 5511.815428263051, "speed/FLOPS": 243594029900382.66, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04882349446415901, "optim/lr": 5.735862977789052e-06, "optim/total_tokens": 1991321321472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2735296487808228, "created_at": "2025-06-03T09:53:03.396158+00:00"} {"global_step": 237385, "acc_step": 0, "speed/wps": 5513.7075764382525, "speed/FLOPS": 243677653164834.25, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04661370813846588, "optim/lr": 5.732315752694506e-06, "optim/total_tokens": 1991329710080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.254942536354065, "created_at": "2025-06-03T09:53:06.372436+00:00"} {"global_step": 237386, "acc_step": 0, "speed/wps": 5524.050888357862, "speed/FLOPS": 244134774609811.28, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.048314936459064484, "optim/lr": 5.728768527600181e-06, "optim/total_tokens": 1991338098688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.265999436378479, "created_at": "2025-06-03T09:53:09.346508+00:00"} {"global_step": 237387, "acc_step": 0, "speed/wps": 5513.536927140467, "speed/FLOPS": 243670111339334.4, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04793212562799454, "optim/lr": 5.725221302505634e-06, "optim/total_tokens": 1991346487296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2539714574813843, "created_at": "2025-06-03T09:53:12.324644+00:00"} {"global_step": 237388, "acc_step": 0, "speed/wps": 5525.215137643376, "speed/FLOPS": 244186228469062.94, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04776836186647415, "optim/lr": 5.721674077411088e-06, "optim/total_tokens": 1991354875904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.273991584777832, "created_at": "2025-06-03T09:53:15.294474+00:00"} {"global_step": 237389, "acc_step": 0, "speed/wps": 5515.404002842211, "speed/FLOPS": 243752626528791.75, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04701115936040878, "optim/lr": 5.718126852316541e-06, "optim/total_tokens": 1991363264512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.265108585357666, "created_at": "2025-06-03T09:53:18.271516+00:00"} {"global_step": 237390, "acc_step": 0, "speed/wps": 5529.419635427345, "speed/FLOPS": 244372045750543.84, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04887903481721878, "optim/lr": 5.714579627222216e-06, "optim/total_tokens": 1991371653120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2594226598739624, "created_at": "2025-06-03T09:53:21.243100+00:00"} {"global_step": 237391, "acc_step": 0, "speed/wps": 5521.683331453454, "speed/FLOPS": 244030140712891.22, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046317923814058304, "optim/lr": 5.7110324021276695e-06, "optim/total_tokens": 1991380041728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.278520107269287, "created_at": "2025-06-03T09:53:24.216296+00:00"} {"global_step": 237392, "acc_step": 0, "speed/wps": 5517.185711097095, "speed/FLOPS": 243831368914048.03, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.050510942935943604, "optim/lr": 5.707485177033122e-06, "optim/total_tokens": 1991388430336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2493789196014404, "created_at": "2025-06-03T09:53:27.190825+00:00"} {"global_step": 237393, "acc_step": 0, "speed/wps": 5511.834638468822, "speed/FLOPS": 243594878893150.97, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.33 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.33, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04627472907304764, "optim/lr": 5.703937951938576e-06, "optim/total_tokens": 1991396818944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.257866382598877, "created_at": "2025-06-03T09:53:30.170055+00:00"} {"global_step": 237394, "acc_step": 0, "speed/wps": 5518.088561135986, "speed/FLOPS": 243871270264561.6, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04789168760180473, "optim/lr": 5.700390726844251e-06, "optim/total_tokens": 1991405207552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2709752321243286, "created_at": "2025-06-03T09:53:33.143730+00:00"} {"global_step": 237395, "acc_step": 0, "speed/wps": 5523.700198827979, "speed/FLOPS": 244119275927582.2, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.05246531590819359, "optim/lr": 5.696843501749704e-06, "optim/total_tokens": 1991413596160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2716577053070068, "created_at": "2025-06-03T09:53:36.117733+00:00"} {"global_step": 237396, "acc_step": 0, "speed/wps": 5522.411255443865, "speed/FLOPS": 244062311227414.66, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.046770092099905014, "optim/lr": 5.693296276655158e-06, "optim/total_tokens": 1991421984768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2737250328063965, "created_at": "2025-06-03T09:53:39.093216+00:00"} {"global_step": 237397, "acc_step": 0, "speed/wps": 5514.683883263308, "speed/FLOPS": 243720800929310.38, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.06, "optim/grad_norm": 0.04910316318273544, "optim/lr": 5.6897490515606105e-06, "optim/total_tokens": 1991430373376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2754805088043213, "created_at": "2025-06-03T09:53:42.068963+00:00"} {"global_step": 237398, "acc_step": 0, "speed/wps": 5528.102969596676, "speed/FLOPS": 244313855860134.9, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.31, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0513918474316597, "optim/lr": 5.686201826466286e-06, "optim/total_tokens": 1991438761984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2503666877746582, "created_at": "2025-06-03T09:53:45.038246+00:00"} {"global_step": 237399, "acc_step": 0, "speed/wps": 5533.214901942574, "speed/FLOPS": 244539777104581.94, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04670132324099541, "optim/lr": 5.68265460137174e-06, "optim/total_tokens": 1991447150592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2527214288711548, "created_at": "2025-06-03T09:53:48.005441+00:00"} {"global_step": 237400, "acc_step": 0, "speed/wps": 5520.001396784054, "speed/FLOPS": 243955807809425.8, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049488555639982224, "optim/lr": 5.6791073762771924e-06, "optim/total_tokens": 1991455539200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.26262629032135, "created_at": "2025-06-03T09:53:50.980080+00:00"} {"global_step": 237401, "acc_step": 0, "speed/wps": 5522.851454937408, "speed/FLOPS": 244081765791883.97, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047777384519577026, "optim/lr": 5.675560151182646e-06, "optim/total_tokens": 1991463927808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2679498195648193, "created_at": "2025-06-03T09:53:53.954688+00:00"} {"global_step": 237402, "acc_step": 0, "speed/wps": 5519.706498081254, "speed/FLOPS": 243942774796190.44, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046754930168390274, "optim/lr": 5.6720129260883216e-06, "optim/total_tokens": 1991472316416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2751585245132446, "created_at": "2025-06-03T09:53:56.927900+00:00"} {"global_step": 237403, "acc_step": 0, "speed/wps": 5529.8362944722485, "speed/FLOPS": 244390459947674.22, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04704717919230461, "optim/lr": 5.668465700993774e-06, "optim/total_tokens": 1991480705024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2640982866287231, "created_at": "2025-06-03T09:53:59.896512+00:00"} {"global_step": 237404, "acc_step": 0, "speed/wps": 5527.024460244231, "speed/FLOPS": 244266191267068.12, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04866984486579895, "optim/lr": 5.664918475899228e-06, "optim/total_tokens": 1991489093632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2760326862335205, "created_at": "2025-06-03T09:54:02.866917+00:00"} {"global_step": 237405, "acc_step": 0, "speed/wps": 5526.636160262205, "speed/FLOPS": 244249030395362.03, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04935489594936371, "optim/lr": 5.661371250804681e-06, "optim/total_tokens": 1991497482240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2566606998443604, "created_at": "2025-06-03T09:54:05.837492+00:00"} {"global_step": 237406, "acc_step": 0, "speed/wps": 5524.023671989413, "speed/FLOPS": 244133571785631.8, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046922601759433746, "optim/lr": 5.657824025710356e-06, "optim/total_tokens": 1991505870848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2661101818084717, "created_at": "2025-06-03T09:54:08.811376+00:00"} {"global_step": 237407, "acc_step": 0, "speed/wps": 5506.684468579271, "speed/FLOPS": 243367267744992.0, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.32 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.32, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047085002064704895, "optim/lr": 5.65427680061581e-06, "optim/total_tokens": 1991514259456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.270547866821289, "created_at": "2025-06-03T09:54:11.791674+00:00"} {"global_step": 237408, "acc_step": 0, "speed/wps": 5517.327277264455, "speed/FLOPS": 243837625414044.0, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04685165360569954, "optim/lr": 5.650729575521263e-06, "optim/total_tokens": 1991522648064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.273429036140442, "created_at": "2025-06-03T09:54:14.765815+00:00"} {"global_step": 237409, "acc_step": 0, "speed/wps": 5513.047386200631, "speed/FLOPS": 243648476135491.34, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046486616134643555, "optim/lr": 5.647182350426716e-06, "optim/total_tokens": 1991531036672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2765809297561646, "created_at": "2025-06-03T09:54:17.744259+00:00"} {"global_step": 237410, "acc_step": 0, "speed/wps": 5519.700025271335, "speed/FLOPS": 243942488731122.88, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04776931181550026, "optim/lr": 5.643635125332392e-06, "optim/total_tokens": 1991539425280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.257368803024292, "created_at": "2025-06-03T09:54:20.717010+00:00"} {"global_step": 237411, "acc_step": 0, "speed/wps": 5511.20921120383, "speed/FLOPS": 243567238209265.28, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047308050096035004, "optim/lr": 5.6400879002378445e-06, "optim/total_tokens": 1991547813888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2650880813598633, "created_at": "2025-06-03T09:54:23.694366+00:00"} {"global_step": 237412, "acc_step": 0, "speed/wps": 5533.300557811974, "speed/FLOPS": 244543562655582.9, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.11, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046693556010723114, "optim/lr": 5.636540675143298e-06, "optim/total_tokens": 1991556202496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2803922891616821, "created_at": "2025-06-03T09:54:26.662297+00:00"} {"global_step": 237413, "acc_step": 0, "speed/wps": 5521.820218846031, "speed/FLOPS": 244036190434989.94, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04755350202322006, "optim/lr": 5.632993450048974e-06, "optim/total_tokens": 1991564591104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2605828046798706, "created_at": "2025-06-03T09:54:29.639706+00:00"} {"global_step": 237414, "acc_step": 0, "speed/wps": 5513.912319680714, "speed/FLOPS": 243686701768180.12, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0470544770359993, "optim/lr": 5.629446224954426e-06, "optim/total_tokens": 1991572979712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2718924283981323, "created_at": "2025-06-03T09:54:32.618626+00:00"} {"global_step": 237415, "acc_step": 0, "speed/wps": 5517.277355825183, "speed/FLOPS": 243835419141949.28, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046145129948854446, "optim/lr": 5.62589899985988e-06, "optim/total_tokens": 1991581368320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2636361122131348, "created_at": "2025-06-03T09:54:35.593521+00:00"} {"global_step": 237416, "acc_step": 0, "speed/wps": 5512.814262307535, "speed/FLOPS": 243638173252652.72, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048270102590322495, "optim/lr": 5.622351774765333e-06, "optim/total_tokens": 1991589756928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2515511512756348, "created_at": "2025-06-03T09:54:38.573515+00:00"} {"global_step": 237417, "acc_step": 0, "speed/wps": 5512.283779949377, "speed/FLOPS": 243614728647677.03, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04717142507433891, "optim/lr": 5.618804549671008e-06, "optim/total_tokens": 1991598145536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2749181985855103, "created_at": "2025-06-03T09:54:41.551210+00:00"} {"global_step": 237418, "acc_step": 0, "speed/wps": 5508.802709984247, "speed/FLOPS": 243460883172949.53, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.31 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.31, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04722515866160393, "optim/lr": 5.615257324576462e-06, "optim/total_tokens": 1991606534144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2761411666870117, "created_at": "2025-06-03T09:54:44.530417+00:00"} {"global_step": 237419, "acc_step": 0, "speed/wps": 5515.711010873084, "speed/FLOPS": 243766194712346.75, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04896145686507225, "optim/lr": 5.611710099481915e-06, "optim/total_tokens": 1991614922752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.267661452293396, "created_at": "2025-06-03T09:54:47.506686+00:00"} {"global_step": 237420, "acc_step": 0, "speed/wps": 5532.662317210487, "speed/FLOPS": 244515355687808.75, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049561791121959686, "optim/lr": 5.608162874387368e-06, "optim/total_tokens": 1991623311360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2457380294799805, "created_at": "2025-06-03T09:54:50.478226+00:00"} {"global_step": 237421, "acc_step": 0, "speed/wps": 5509.090620846204, "speed/FLOPS": 243473607359386.66, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04890770465135574, "optim/lr": 5.604615649293044e-06, "optim/total_tokens": 1991631699968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2545682191848755, "created_at": "2025-06-03T09:54:53.456798+00:00"} {"global_step": 237422, "acc_step": 0, "speed/wps": 5533.768903456424, "speed/FLOPS": 244564261135857.28, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.12, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04870852082967758, "optim/lr": 5.6010684241984965e-06, "optim/total_tokens": 1991640088576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.259856939315796, "created_at": "2025-06-03T09:54:56.425838+00:00"} {"global_step": 237423, "acc_step": 0, "speed/wps": 5518.832477949553, "speed/FLOPS": 243904147580009.84, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04691700637340546, "optim/lr": 5.59752119910395e-06, "optim/total_tokens": 1991648477184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2529371976852417, "created_at": "2025-06-03T09:54:59.400245+00:00"} {"global_step": 237424, "acc_step": 0, "speed/wps": 5521.665516994038, "speed/FLOPS": 244029353404967.7, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04933419078588486, "optim/lr": 5.593973974009403e-06, "optim/total_tokens": 1991656865792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2578232288360596, "created_at": "2025-06-03T09:55:02.372216+00:00"} {"global_step": 237425, "acc_step": 0, "speed/wps": 5513.65266287382, "speed/FLOPS": 243675226266359.44, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05082092061638832, "optim/lr": 5.590426748915078e-06, "optim/total_tokens": 1991665254400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.26029372215271, "created_at": "2025-06-03T09:55:05.348352+00:00"} {"global_step": 237426, "acc_step": 0, "speed/wps": 5522.990470986309, "speed/FLOPS": 244087909589696.78, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04671900346875191, "optim/lr": 5.586879523820532e-06, "optim/total_tokens": 1991673643008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.270790457725525, "created_at": "2025-06-03T09:55:08.320171+00:00"} {"global_step": 237427, "acc_step": 0, "speed/wps": 5506.98661969478, "speed/FLOPS": 243380621277747.88, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049027204513549805, "optim/lr": 5.583332298725985e-06, "optim/total_tokens": 1991682031616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2656747102737427, "created_at": "2025-06-03T09:55:11.303780+00:00"} {"global_step": 237428, "acc_step": 0, "speed/wps": 5512.324337991442, "speed/FLOPS": 243616521105541.4, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.3 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.3, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0504266582429409, "optim/lr": 5.579785073631438e-06, "optim/total_tokens": 1991690420224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2826740741729736, "created_at": "2025-06-03T09:55:14.280949+00:00"} {"global_step": 237429, "acc_step": 0, "speed/wps": 5532.359780452741, "speed/FLOPS": 244501985111639.84, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.26, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.050486091524362564, "optim/lr": 5.576237848537113e-06, "optim/total_tokens": 1991698808832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2702347040176392, "created_at": "2025-06-03T09:55:17.246703+00:00"} {"global_step": 237430, "acc_step": 0, "speed/wps": 5522.883010852948, "speed/FLOPS": 244083160401833.06, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04707104340195656, "optim/lr": 5.572690623442567e-06, "optim/total_tokens": 1991707197440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2511866092681885, "created_at": "2025-06-03T09:55:20.222111+00:00"} {"global_step": 237431, "acc_step": 0, "speed/wps": 5517.106743726178, "speed/FLOPS": 243827878960445.16, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.050318412482738495, "optim/lr": 5.56914339834802e-06, "optim/total_tokens": 1991715586048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2808680534362793, "created_at": "2025-06-03T09:55:23.197342+00:00"} {"global_step": 237432, "acc_step": 0, "speed/wps": 5521.052562254403, "speed/FLOPS": 244002263942862.6, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04717414826154709, "optim/lr": 5.565596173253473e-06, "optim/total_tokens": 1991723974656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2761340141296387, "created_at": "2025-06-03T09:55:26.169410+00:00"} {"global_step": 237433, "acc_step": 0, "speed/wps": 5519.248426011888, "speed/FLOPS": 243922530355349.84, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0005, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04661424458026886, "optim/lr": 5.5620489481591486e-06, "optim/total_tokens": 1991732363264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.259706735610962, "created_at": "2025-06-03T09:55:29.148059+00:00"} {"global_step": 237434, "acc_step": 0, "speed/wps": 5519.854934818995, "speed/FLOPS": 243949334940230.5, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04655115306377411, "optim/lr": 5.558501723064602e-06, "optim/total_tokens": 1991740751872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2754474878311157, "created_at": "2025-06-03T09:55:32.123538+00:00"} {"global_step": 237435, "acc_step": 0, "speed/wps": 5513.498366490048, "speed/FLOPS": 243668407155957.2, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047259505838155746, "optim/lr": 5.554954497970055e-06, "optim/total_tokens": 1991749140480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2561264038085938, "created_at": "2025-06-03T09:55:35.099783+00:00"} {"global_step": 237436, "acc_step": 0, "speed/wps": 5519.117682580455, "speed/FLOPS": 243916752164886.06, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04797574505209923, "optim/lr": 5.5514072728755085e-06, "optim/total_tokens": 1991757529088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.277329444885254, "created_at": "2025-06-03T09:55:38.074536+00:00"} {"global_step": 237437, "acc_step": 0, "speed/wps": 5524.72069144697, "speed/FLOPS": 244164376477986.84, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04723745957016945, "optim/lr": 5.547860047781183e-06, "optim/total_tokens": 1991765917696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2589505910873413, "created_at": "2025-06-03T09:55:41.045615+00:00"} {"global_step": 237438, "acc_step": 0, "speed/wps": 5518.297452728512, "speed/FLOPS": 243880502203747.16, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0476883128285408, "optim/lr": 5.544312822686637e-06, "optim/total_tokens": 1991774306304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2693209648132324, "created_at": "2025-06-03T09:55:44.019097+00:00"} {"global_step": 237439, "acc_step": 0, "speed/wps": 5508.231031056178, "speed/FLOPS": 243435617890446.9, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04759055748581886, "optim/lr": 5.54076559759209e-06, "optim/total_tokens": 1991782694912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.263241171836853, "created_at": "2025-06-03T09:55:47.000319+00:00"} {"global_step": 237440, "acc_step": 0, "speed/wps": 5521.102720976557, "speed/FLOPS": 244004480701646.2, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04930739849805832, "optim/lr": 5.537218372497765e-06, "optim/total_tokens": 1991791083520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.271569848060608, "created_at": "2025-06-03T09:55:49.976548+00:00"} {"global_step": 237441, "acc_step": 0, "speed/wps": 5516.527600385405, "speed/FLOPS": 243802283789107.3, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04773872718214989, "optim/lr": 5.533671147403219e-06, "optim/total_tokens": 1991799472128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.264019250869751, "created_at": "2025-06-03T09:55:52.954394+00:00"} {"global_step": 237442, "acc_step": 0, "speed/wps": 5511.369002250841, "speed/FLOPS": 243574300155658.44, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.29 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.29, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047863706946372986, "optim/lr": 5.530123922308672e-06, "optim/total_tokens": 1991807860736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2611464262008667, "created_at": "2025-06-03T09:55:55.931979+00:00"} {"global_step": 237443, "acc_step": 0, "speed/wps": 5516.164306315465, "speed/FLOPS": 243786228050723.6, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048854123800992966, "optim/lr": 5.526576697214125e-06, "optim/total_tokens": 1991816249344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2486681938171387, "created_at": "2025-06-03T09:55:58.911392+00:00"} {"global_step": 237444, "acc_step": 0, "speed/wps": 5510.771272537792, "speed/FLOPS": 243547883561799.72, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04687945544719696, "optim/lr": 5.523029472119801e-06, "optim/total_tokens": 1991824637952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2487791776657104, "created_at": "2025-06-03T09:56:01.889015+00:00"} {"global_step": 237445, "acc_step": 0, "speed/wps": 5510.370943371553, "speed/FLOPS": 243530191061722.34, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0479704812169075, "optim/lr": 5.519482247025253e-06, "optim/total_tokens": 1991833026560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2615118026733398, "created_at": "2025-06-03T09:56:04.867969+00:00"} {"global_step": 237446, "acc_step": 0, "speed/wps": 5522.720933444916, "speed/FLOPS": 244075997409985.4, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04725213348865509, "optim/lr": 5.515935021930707e-06, "optim/total_tokens": 1991841415168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2573002576828003, "created_at": "2025-06-03T09:56:07.840419+00:00"} {"global_step": 237447, "acc_step": 0, "speed/wps": 5525.843216864023, "speed/FLOPS": 244213986355814.66, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049803782254457474, "optim/lr": 5.5123877968361606e-06, "optim/total_tokens": 1991849803776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.268832802772522, "created_at": "2025-06-03T09:56:10.814847+00:00"} {"global_step": 237448, "acc_step": 0, "speed/wps": 5520.254613972963, "speed/FLOPS": 243966998713092.5, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04882104694843292, "optim/lr": 5.508840571741835e-06, "optim/total_tokens": 1991858192384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2644624710083008, "created_at": "2025-06-03T09:56:13.787327+00:00"} {"global_step": 237449, "acc_step": 0, "speed/wps": 5521.010980744365, "speed/FLOPS": 244000426252952.38, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047415148466825485, "optim/lr": 5.505293346647289e-06, "optim/total_tokens": 1991866580992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2648192644119263, "created_at": "2025-06-03T09:56:16.760842+00:00"} {"global_step": 237450, "acc_step": 0, "speed/wps": 5502.875351946605, "speed/FLOPS": 243198924286654.53, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04741225391626358, "optim/lr": 5.501746121552742e-06, "optim/total_tokens": 1991874969600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2634221315383911, "created_at": "2025-06-03T09:56:19.747044+00:00"} {"global_step": 237451, "acc_step": 0, "speed/wps": 5507.999650805846, "speed/FLOPS": 243425392067693.72, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05007675290107727, "optim/lr": 5.498198896458195e-06, "optim/total_tokens": 1991883358208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2491495609283447, "created_at": "2025-06-03T09:56:22.726117+00:00"} {"global_step": 237452, "acc_step": 0, "speed/wps": 5524.292128899354, "speed/FLOPS": 244145436206964.2, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04662257060408592, "optim/lr": 5.494651671363871e-06, "optim/total_tokens": 1991891746816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2473959922790527, "created_at": "2025-06-03T09:56:25.696531+00:00"} {"global_step": 237453, "acc_step": 0, "speed/wps": 5509.51003176469, "speed/FLOPS": 243492143175244.1, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.28 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.28, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048938993364572525, "optim/lr": 5.4911044462693235e-06, "optim/total_tokens": 1991900135424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2526170015335083, "created_at": "2025-06-03T09:56:28.678357+00:00"} {"global_step": 237454, "acc_step": 0, "speed/wps": 5522.087159445515, "speed/FLOPS": 244047987843161.28, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04872628673911095, "optim/lr": 5.487557221174777e-06, "optim/total_tokens": 1991908524032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2538341283798218, "created_at": "2025-06-03T09:56:31.655358+00:00"} {"global_step": 237455, "acc_step": 0, "speed/wps": 5520.716110163784, "speed/FLOPS": 243987394482575.16, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04747908562421799, "optim/lr": 5.484009996080231e-06, "optim/total_tokens": 1991916912640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2695626020431519, "created_at": "2025-06-03T09:56:34.627860+00:00"} {"global_step": 237456, "acc_step": 0, "speed/wps": 5514.347273525952, "speed/FLOPS": 243705924501844.03, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04671023041009903, "optim/lr": 5.480462770985905e-06, "optim/total_tokens": 1991925301248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2603498697280884, "created_at": "2025-06-03T09:56:37.603375+00:00"} {"global_step": 237457, "acc_step": 0, "speed/wps": 5530.659588910299, "speed/FLOPS": 244426845347833.12, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04837404936552048, "optim/lr": 5.476915545891359e-06, "optim/total_tokens": 1991933689856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2588884830474854, "created_at": "2025-06-03T09:56:40.571791+00:00"} {"global_step": 237458, "acc_step": 0, "speed/wps": 5518.666883202305, "speed/FLOPS": 243896829139772.22, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04795784875750542, "optim/lr": 5.473368320796812e-06, "optim/total_tokens": 1991942078464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.260042667388916, "created_at": "2025-06-03T09:56:43.547522+00:00"} {"global_step": 237459, "acc_step": 0, "speed/wps": 5525.901588993153, "speed/FLOPS": 244216566105146.56, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046954501420259476, "optim/lr": 5.469821095702265e-06, "optim/total_tokens": 1991950467072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.269078254699707, "created_at": "2025-06-03T09:56:46.516859+00:00"} {"global_step": 237460, "acc_step": 0, "speed/wps": 5508.9154187564, "speed/FLOPS": 243465864323782.94, "speed/curr_iter_time": 2.9731, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9731, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04630663990974426, "optim/lr": 5.466273870607941e-06, "optim/total_tokens": 1991958855680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2556145191192627, "created_at": "2025-06-03T09:56:49.497558+00:00"} {"global_step": 237461, "acc_step": 0, "speed/wps": 5508.373911960376, "speed/FLOPS": 243441932495081.72, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04734589904546738, "optim/lr": 5.462726645513394e-06, "optim/total_tokens": 1991967244288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2775254249572754, "created_at": "2025-06-03T09:56:52.476326+00:00"} {"global_step": 237462, "acc_step": 0, "speed/wps": 5526.814782416203, "speed/FLOPS": 244256924580297.72, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047455813735723495, "optim/lr": 5.459179420418847e-06, "optim/total_tokens": 1991975632896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.254833459854126, "created_at": "2025-06-03T09:56:55.445361+00:00"} {"global_step": 237463, "acc_step": 0, "speed/wps": 5516.269075783909, "speed/FLOPS": 243790858324970.06, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04829378426074982, "optim/lr": 5.4556321953243e-06, "optim/total_tokens": 1991984021504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2664828300476074, "created_at": "2025-06-03T09:56:58.422954+00:00"} {"global_step": 237464, "acc_step": 0, "speed/wps": 5513.747057214587, "speed/FLOPS": 243679398013067.28, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.27 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.27, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047801341861486435, "optim/lr": 5.4520849702299756e-06, "optim/total_tokens": 1991992410112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2633088827133179, "created_at": "2025-06-03T09:57:01.402212+00:00"} {"global_step": 237465, "acc_step": 0, "speed/wps": 5523.689023039002, "speed/FLOPS": 244118782014912.25, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04662998765707016, "optim/lr": 5.448537745135429e-06, "optim/total_tokens": 1992000798720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2776110172271729, "created_at": "2025-06-03T09:57:04.373845+00:00"} {"global_step": 237466, "acc_step": 0, "speed/wps": 5524.972368054958, "speed/FLOPS": 244175499295862.25, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04735485091805458, "optim/lr": 5.444990520040882e-06, "optim/total_tokens": 1992009187328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2613341808319092, "created_at": "2025-06-03T09:57:07.344712+00:00"} {"global_step": 237467, "acc_step": 0, "speed/wps": 5522.8609069365875, "speed/FLOPS": 244082183521868.0, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049138687551021576, "optim/lr": 5.4414432949463355e-06, "optim/total_tokens": 1992017575936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.251873254776001, "created_at": "2025-06-03T09:57:10.319742+00:00"} {"global_step": 237468, "acc_step": 0, "speed/wps": 5520.921115222798, "speed/FLOPS": 243996454656872.56, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04694141820073128, "optim/lr": 5.437896069852011e-06, "optim/total_tokens": 1992025964544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.259727120399475, "created_at": "2025-06-03T09:57:13.291789+00:00"} {"global_step": 237469, "acc_step": 0, "speed/wps": 5524.044792166369, "speed/FLOPS": 244134505189350.4, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04755859822034836, "optim/lr": 5.434348844757464e-06, "optim/total_tokens": 1992034353152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.260101556777954, "created_at": "2025-06-03T09:57:16.263630+00:00"} {"global_step": 237470, "acc_step": 0, "speed/wps": 5514.966678388433, "speed/FLOPS": 243733299026364.22, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048530831933021545, "optim/lr": 5.430801619662917e-06, "optim/total_tokens": 1992042741760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2560802698135376, "created_at": "2025-06-03T09:57:19.239110+00:00"} {"global_step": 237471, "acc_step": 0, "speed/wps": 5525.181123489584, "speed/FLOPS": 244184725217565.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04711112007498741, "optim/lr": 5.427254394568593e-06, "optim/total_tokens": 1992051130368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2637375593185425, "created_at": "2025-06-03T09:57:22.213845+00:00"} {"global_step": 237472, "acc_step": 0, "speed/wps": 5522.37548679715, "speed/FLOPS": 244060730436310.38, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.56, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04716711863875389, "optim/lr": 5.423707169474046e-06, "optim/total_tokens": 1992059518976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2513444423675537, "created_at": "2025-06-03T09:57:25.190495+00:00"} {"global_step": 237473, "acc_step": 0, "speed/wps": 5518.284361840192, "speed/FLOPS": 243879923653488.66, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04710828885436058, "optim/lr": 5.420159944379499e-06, "optim/total_tokens": 1992067907584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.249598741531372, "created_at": "2025-06-03T09:57:28.166992+00:00"} {"global_step": 237474, "acc_step": 0, "speed/wps": 5522.932303821836, "speed/FLOPS": 244085338898753.62, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047049786895513535, "optim/lr": 5.416612719284952e-06, "optim/total_tokens": 1992076296192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2648334503173828, "created_at": "2025-06-03T09:57:31.138203+00:00"} {"global_step": 237475, "acc_step": 0, "speed/wps": 5526.596840188463, "speed/FLOPS": 244247292649361.03, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04677309840917587, "optim/lr": 5.413065494190628e-06, "optim/total_tokens": 1992084684800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.269295334815979, "created_at": "2025-06-03T09:57:34.107320+00:00"} {"global_step": 237476, "acc_step": 0, "speed/wps": 5523.516517085633, "speed/FLOPS": 244111158134738.84, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04679161682724953, "optim/lr": 5.409518269096081e-06, "optim/total_tokens": 1992093073408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2607208490371704, "created_at": "2025-06-03T09:57:37.078305+00:00"} {"global_step": 237477, "acc_step": 0, "speed/wps": 5514.406119076848, "speed/FLOPS": 243708525173994.8, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.26 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.26, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04725348949432373, "optim/lr": 5.405971044001534e-06, "optim/total_tokens": 1992101462016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2622942924499512, "created_at": "2025-06-03T09:57:40.054226+00:00"} {"global_step": 237478, "acc_step": 0, "speed/wps": 5534.47430004565, "speed/FLOPS": 244595436054554.03, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.21, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04656464606523514, "optim/lr": 5.4024238189069876e-06, "optim/total_tokens": 1992109850624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2705379724502563, "created_at": "2025-06-03T09:57:43.018793+00:00"} {"global_step": 237479, "acc_step": 0, "speed/wps": 5523.260984252086, "speed/FLOPS": 244099864891431.72, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04748333618044853, "optim/lr": 5.398876593812663e-06, "optim/total_tokens": 1992118239232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2480684518814087, "created_at": "2025-06-03T09:57:45.989533+00:00"} {"global_step": 237480, "acc_step": 0, "speed/wps": 5520.655944434226, "speed/FLOPS": 243984735465284.8, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047130510210990906, "optim/lr": 5.395329368718116e-06, "optim/total_tokens": 1992126627840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2613662481307983, "created_at": "2025-06-03T09:57:48.965330+00:00"} {"global_step": 237481, "acc_step": 0, "speed/wps": 5527.6197886035525, "speed/FLOPS": 244292501733383.38, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04682578518986702, "optim/lr": 5.3917821436235695e-06, "optim/total_tokens": 1992135016448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.259925365447998, "created_at": "2025-06-03T09:57:51.935009+00:00"} {"global_step": 237482, "acc_step": 0, "speed/wps": 5524.34124405719, "speed/FLOPS": 244147606845546.38, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04786555841565132, "optim/lr": 5.388234918529022e-06, "optim/total_tokens": 1992143405056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2657643556594849, "created_at": "2025-06-03T09:57:54.908911+00:00"} {"global_step": 237483, "acc_step": 0, "speed/wps": 5509.5816282758715, "speed/FLOPS": 243495307374574.12, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047112226486206055, "optim/lr": 5.384687693434698e-06, "optim/total_tokens": 1992151793664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.259812831878662, "created_at": "2025-06-03T09:57:57.889283+00:00"} {"global_step": 237484, "acc_step": 0, "speed/wps": 5513.138446445226, "speed/FLOPS": 243652500532213.84, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047230299562215805, "optim/lr": 5.381140468340151e-06, "optim/total_tokens": 1992160182272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2698988914489746, "created_at": "2025-06-03T09:58:00.865330+00:00"} {"global_step": 237485, "acc_step": 0, "speed/wps": 5509.621236775706, "speed/FLOPS": 243497057867532.12, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04679177701473236, "optim/lr": 5.377593243245604e-06, "optim/total_tokens": 1992168570880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.263551115989685, "created_at": "2025-06-03T09:58:03.843496+00:00"} {"global_step": 237486, "acc_step": 0, "speed/wps": 5507.306351650839, "speed/FLOPS": 243394751793669.2, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047001563012599945, "optim/lr": 5.374046018151058e-06, "optim/total_tokens": 1992176959488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2679367065429688, "created_at": "2025-06-03T09:58:06.828314+00:00"} {"global_step": 237487, "acc_step": 0, "speed/wps": 5513.437709140977, "speed/FLOPS": 243665726411600.7, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047929324209690094, "optim/lr": 5.370498793056733e-06, "optim/total_tokens": 1992185348096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2529222965240479, "created_at": "2025-06-03T09:58:09.804947+00:00"} {"global_step": 237488, "acc_step": 0, "speed/wps": 5529.39670099344, "speed/FLOPS": 244371032165954.3, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046986982226371765, "optim/lr": 5.366951567962186e-06, "optim/total_tokens": 1992193736704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2683947086334229, "created_at": "2025-06-03T09:58:12.772606+00:00"} {"global_step": 237489, "acc_step": 0, "speed/wps": 5519.765205212116, "speed/FLOPS": 243945369350884.2, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.25 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.25, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047009386122226715, "optim/lr": 5.36340434286764e-06, "optim/total_tokens": 1992202125312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.264281988143921, "created_at": "2025-06-03T09:58:15.749065+00:00"} {"global_step": 237490, "acc_step": 0, "speed/wps": 5529.982353568287, "speed/FLOPS": 244396915012120.9, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04733864963054657, "optim/lr": 5.359857117773092e-06, "optim/total_tokens": 1992210513920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.265650749206543, "created_at": "2025-06-03T09:58:18.717949+00:00"} {"global_step": 237491, "acc_step": 0, "speed/wps": 5522.123843479128, "speed/FLOPS": 244049609089681.06, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04688747227191925, "optim/lr": 5.356309892678768e-06, "optim/total_tokens": 1992218902528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.253229022026062, "created_at": "2025-06-03T09:58:21.694982+00:00"} {"global_step": 237492, "acc_step": 0, "speed/wps": 5528.758500087972, "speed/FLOPS": 244342826952540.97, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0473732091486454, "optim/lr": 5.3527626675842215e-06, "optim/total_tokens": 1992227291136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2486413717269897, "created_at": "2025-06-03T09:58:24.666441+00:00"} {"global_step": 237493, "acc_step": 0, "speed/wps": 5526.284808674785, "speed/FLOPS": 244233502453578.56, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04857119917869568, "optim/lr": 5.349215442489674e-06, "optim/total_tokens": 1992235679744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.267451286315918, "created_at": "2025-06-03T09:58:27.635494+00:00"} {"global_step": 237494, "acc_step": 0, "speed/wps": 5515.708454028528, "speed/FLOPS": 243766081712904.5, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048044923692941666, "optim/lr": 5.345668217395128e-06, "optim/total_tokens": 1992244068352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2518430948257446, "created_at": "2025-06-03T09:58:30.614420+00:00"} {"global_step": 237495, "acc_step": 0, "speed/wps": 5527.670691992726, "speed/FLOPS": 244294751402637.66, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0490543432533741, "optim/lr": 5.3421209923008026e-06, "optim/total_tokens": 1992252456960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.274726152420044, "created_at": "2025-06-03T09:58:33.583027+00:00"} {"global_step": 237496, "acc_step": 0, "speed/wps": 5533.715150502805, "speed/FLOPS": 244561885530439.88, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.17, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04661170020699501, "optim/lr": 5.338573767206256e-06, "optim/total_tokens": 1992260845568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2700241804122925, "created_at": "2025-06-03T09:58:36.548605+00:00"} {"global_step": 237497, "acc_step": 0, "speed/wps": 5527.879035624894, "speed/FLOPS": 244303959124780.1, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04696488380432129, "optim/lr": 5.33502654211171e-06, "optim/total_tokens": 1992269234176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2706083059310913, "created_at": "2025-06-03T09:58:39.516396+00:00"} {"global_step": 237498, "acc_step": 0, "speed/wps": 5525.634672600904, "speed/FLOPS": 244204769766811.1, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05039466544985771, "optim/lr": 5.3314793170173844e-06, "optim/total_tokens": 1992277622784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2524136304855347, "created_at": "2025-06-03T09:58:42.488830+00:00"} {"global_step": 237499, "acc_step": 0, "speed/wps": 5515.985922240327, "speed/FLOPS": 243778344387654.97, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04667558893561363, "optim/lr": 5.327932091922838e-06, "optim/total_tokens": 1992286011392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2693253755569458, "created_at": "2025-06-03T09:58:45.463653+00:00"} {"global_step": 237500, "acc_step": 0, "speed/wps": 5516.326718244798, "speed/FLOPS": 243793405826700.5, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048176757991313934, "optim/lr": 5.324384866828292e-06, "optim/total_tokens": 1992294400000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2592480182647705, "created_at": "2025-06-03T09:58:48.439960+00:00"} {"global_step": 237501, "acc_step": 0, "speed/wps": 5505.168555285982, "speed/FLOPS": 243300272136576.22, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04876786470413208, "optim/lr": 5.320837641733744e-06, "optim/total_tokens": 1992302788608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.258410096168518, "created_at": "2025-06-03T09:58:51.420775+00:00"} {"global_step": 237502, "acc_step": 0, "speed/wps": 5513.277370912328, "speed/FLOPS": 243658640282579.84, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04697781428694725, "optim/lr": 5.31729041663942e-06, "optim/total_tokens": 1992311177216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2526111602783203, "created_at": "2025-06-03T09:58:54.402459+00:00"} {"global_step": 237503, "acc_step": 0, "speed/wps": 5511.5799660393295, "speed/FLOPS": 243583623675299.06, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.24 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.24, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047014955431222916, "optim/lr": 5.313743191544873e-06, "optim/total_tokens": 1992319565824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.276084303855896, "created_at": "2025-06-03T09:58:57.380376+00:00"} {"global_step": 237504, "acc_step": 0, "speed/wps": 5522.27599117625, "speed/FLOPS": 244056333239131.34, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047404590994119644, "optim/lr": 5.310195966450326e-06, "optim/total_tokens": 1992327954432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2782111167907715, "created_at": "2025-06-03T09:59:00.357218+00:00"} {"global_step": 237505, "acc_step": 0, "speed/wps": 5529.704126859667, "speed/FLOPS": 244384618815693.28, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046725936233997345, "optim/lr": 5.30664874135578e-06, "optim/total_tokens": 1992336343040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2586122751235962, "created_at": "2025-06-03T09:59:03.326132+00:00"} {"global_step": 237506, "acc_step": 0, "speed/wps": 5513.56089919264, "speed/FLOPS": 243671170781340.38, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0473572313785553, "optim/lr": 5.303101516261455e-06, "optim/total_tokens": 1992344731648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2649582624435425, "created_at": "2025-06-03T09:59:06.302303+00:00"} {"global_step": 237507, "acc_step": 0, "speed/wps": 5516.04447242377, "speed/FLOPS": 243780932006076.12, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046764858067035675, "optim/lr": 5.299554291166908e-06, "optim/total_tokens": 1992353120256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.253929615020752, "created_at": "2025-06-03T09:59:09.276553+00:00"} {"global_step": 237508, "acc_step": 0, "speed/wps": 5533.932299316609, "speed/FLOPS": 244571482396541.62, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.26, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04686153680086136, "optim/lr": 5.296007066072361e-06, "optim/total_tokens": 1992361508864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2646639347076416, "created_at": "2025-06-03T09:59:12.245689+00:00"} {"global_step": 237509, "acc_step": 0, "speed/wps": 5519.540235674609, "speed/FLOPS": 243935426848824.88, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04770750179886818, "optim/lr": 5.2924598409778146e-06, "optim/total_tokens": 1992369897472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2627993822097778, "created_at": "2025-06-03T09:59:15.218318+00:00"} {"global_step": 237510, "acc_step": 0, "speed/wps": 5533.8843612570645, "speed/FLOPS": 244569363779679.0, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04710175842046738, "optim/lr": 5.28891261588349e-06, "optim/total_tokens": 1992378286080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.271931767463684, "created_at": "2025-06-03T09:59:18.183325+00:00"} {"global_step": 237511, "acc_step": 0, "speed/wps": 5511.713305057753, "speed/FLOPS": 243589516577422.44, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04931911081075668, "optim/lr": 5.285365390788943e-06, "optim/total_tokens": 1992386674688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2759159803390503, "created_at": "2025-06-03T09:59:21.160260+00:00"} {"global_step": 237512, "acc_step": 0, "speed/wps": 5518.262707550184, "speed/FLOPS": 243878966644707.0, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04829232767224312, "optim/lr": 5.2818181656943965e-06, "optim/total_tokens": 1992395063296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2560265064239502, "created_at": "2025-06-03T09:59:24.133649+00:00"} {"global_step": 237513, "acc_step": 0, "speed/wps": 5517.08920966636, "speed/FLOPS": 243827104044748.66, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04649433121085167, "optim/lr": 5.27827094059985e-06, "optim/total_tokens": 1992403451904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.25798761844635, "created_at": "2025-06-03T09:59:27.107430+00:00"} {"global_step": 237514, "acc_step": 0, "speed/wps": 5510.696099039863, "speed/FLOPS": 243544561277964.06, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04702218249440193, "optim/lr": 5.274723715505525e-06, "optim/total_tokens": 1992411840512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2742341756820679, "created_at": "2025-06-03T09:59:30.089377+00:00"} {"global_step": 237515, "acc_step": 0, "speed/wps": 5508.400941135135, "speed/FLOPS": 243443127046258.22, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.23 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.23, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05064205825328827, "optim/lr": 5.271176490410978e-06, "optim/total_tokens": 1992420229120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2571673393249512, "created_at": "2025-06-03T09:59:33.070206+00:00"} {"global_step": 237516, "acc_step": 0, "speed/wps": 5527.910178723612, "speed/FLOPS": 244305335490338.62, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04687042161822319, "optim/lr": 5.267629265316431e-06, "optim/total_tokens": 1992428617728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.249382734298706, "created_at": "2025-06-03T09:59:36.040604+00:00"} {"global_step": 237517, "acc_step": 0, "speed/wps": 5517.3019703620785, "speed/FLOPS": 243836506978491.44, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04921945929527283, "optim/lr": 5.264082040221885e-06, "optim/total_tokens": 1992437006336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2580726146697998, "created_at": "2025-06-03T09:59:39.014652+00:00"} {"global_step": 237518, "acc_step": 0, "speed/wps": 5516.875401378879, "speed/FLOPS": 243817654812812.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04899327829480171, "optim/lr": 5.26053481512756e-06, "optim/total_tokens": 1992445394944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.25806725025177, "created_at": "2025-06-03T09:59:41.989681+00:00"} {"global_step": 237519, "acc_step": 0, "speed/wps": 5516.974015187322, "speed/FLOPS": 243822013038393.97, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04781443998217583, "optim/lr": 5.256987590033013e-06, "optim/total_tokens": 1992453783552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2498483657836914, "created_at": "2025-06-03T09:59:44.970016+00:00"} {"global_step": 237520, "acc_step": 0, "speed/wps": 5502.895915674673, "speed/FLOPS": 243199833098180.44, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047921113669872284, "optim/lr": 5.253440364938467e-06, "optim/total_tokens": 1992462172160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.260615348815918, "created_at": "2025-06-03T09:59:47.951923+00:00"} {"global_step": 237521, "acc_step": 0, "speed/wps": 5524.413506727433, "speed/FLOPS": 244150800485697.22, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048815082758665085, "optim/lr": 5.24989313984392e-06, "optim/total_tokens": 1992470560768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2836803197860718, "created_at": "2025-06-03T09:59:50.921689+00:00"} {"global_step": 237522, "acc_step": 0, "speed/wps": 5529.387124506075, "speed/FLOPS": 244370608934229.7, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04846906289458275, "optim/lr": 5.246345914749595e-06, "optim/total_tokens": 1992478949376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.258785605430603, "created_at": "2025-06-03T09:59:53.890723+00:00"} {"global_step": 237523, "acc_step": 0, "speed/wps": 5516.670832459667, "speed/FLOPS": 243808613913661.47, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048781510442495346, "optim/lr": 5.2427986896550485e-06, "optim/total_tokens": 1992487337984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2594242095947266, "created_at": "2025-06-03T09:59:56.864707+00:00"} {"global_step": 237524, "acc_step": 0, "speed/wps": 5532.04318853116, "speed/FLOPS": 244487993369170.34, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04706442728638649, "optim/lr": 5.239251464560501e-06, "optim/total_tokens": 1992495726592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2644892930984497, "created_at": "2025-06-03T09:59:59.830710+00:00"} {"global_step": 237525, "acc_step": 0, "speed/wps": 5524.340351953335, "speed/FLOPS": 244147567419122.2, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.62, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04755135998129845, "optim/lr": 5.235704239466177e-06, "optim/total_tokens": 1992504115200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2745778560638428, "created_at": "2025-06-03T10:00:02.800435+00:00"} {"global_step": 237526, "acc_step": 0, "speed/wps": 5515.2171000907465, "speed/FLOPS": 243744366383832.0, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04705174267292023, "optim/lr": 5.23215701437163e-06, "optim/total_tokens": 1992512503808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2717710733413696, "created_at": "2025-06-03T10:00:05.774982+00:00"} {"global_step": 237527, "acc_step": 0, "speed/wps": 5509.8790208461805, "speed/FLOPS": 243508450603988.62, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.22 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.22, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04632943868637085, "optim/lr": 5.228609789277083e-06, "optim/total_tokens": 1992520892416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.261109709739685, "created_at": "2025-06-03T10:00:08.753990+00:00"} {"global_step": 237528, "acc_step": 0, "speed/wps": 5519.567775883104, "speed/FLOPS": 243936643985076.78, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04853862151503563, "optim/lr": 5.225062564182537e-06, "optim/total_tokens": 1992529281024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2714189291000366, "created_at": "2025-06-03T10:00:11.726410+00:00"} {"global_step": 237529, "acc_step": 0, "speed/wps": 5524.593546233517, "speed/FLOPS": 244158757310340.44, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04763052985072136, "optim/lr": 5.221515339088212e-06, "optim/total_tokens": 1992537669632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2683638334274292, "created_at": "2025-06-03T10:00:14.699130+00:00"} {"global_step": 237530, "acc_step": 0, "speed/wps": 5522.398044917859, "speed/FLOPS": 244061727389782.78, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04712097346782684, "optim/lr": 5.217968113993665e-06, "optim/total_tokens": 1992546058240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.245803952217102, "created_at": "2025-06-03T10:00:17.670004+00:00"} {"global_step": 237531, "acc_step": 0, "speed/wps": 5516.068460664708, "speed/FLOPS": 243781992163542.66, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04650922864675522, "optim/lr": 5.214420888899119e-06, "optim/total_tokens": 1992554446848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.259540319442749, "created_at": "2025-06-03T10:00:20.647221+00:00"} {"global_step": 237532, "acc_step": 0, "speed/wps": 5518.235765852161, "speed/FLOPS": 243877775959554.5, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04745796322822571, "optim/lr": 5.210873663804571e-06, "optim/total_tokens": 1992562835456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2678296566009521, "created_at": "2025-06-03T10:00:23.620995+00:00"} {"global_step": 237533, "acc_step": 0, "speed/wps": 5508.527862148288, "speed/FLOPS": 243448736305398.9, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047175947576761246, "optim/lr": 5.207326438710247e-06, "optim/total_tokens": 1992571224064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2550185918807983, "created_at": "2025-06-03T10:00:26.604727+00:00"} {"global_step": 237534, "acc_step": 0, "speed/wps": 5515.062799557619, "speed/FLOPS": 243737547090049.47, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04715485870838165, "optim/lr": 5.2037792136157006e-06, "optim/total_tokens": 1992579612672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2581214904785156, "created_at": "2025-06-03T10:00:29.582671+00:00"} {"global_step": 237535, "acc_step": 0, "speed/wps": 5520.297544755685, "speed/FLOPS": 243968896033949.12, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04699638858437538, "optim/lr": 5.200231988521153e-06, "optim/total_tokens": 1992588001280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2730140686035156, "created_at": "2025-06-03T10:00:32.558917+00:00"} {"global_step": 237536, "acc_step": 0, "speed/wps": 5520.010226751285, "speed/FLOPS": 243956198048781.53, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04775428771972656, "optim/lr": 5.196684763426607e-06, "optim/total_tokens": 1992596389888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2561455965042114, "created_at": "2025-06-03T10:00:35.535351+00:00"} {"global_step": 237537, "acc_step": 0, "speed/wps": 5516.236666563784, "speed/FLOPS": 243789426003325.97, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047164611518383026, "optim/lr": 5.1931375383322824e-06, "optim/total_tokens": 1992604778496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.276143193244934, "created_at": "2025-06-03T10:00:38.513560+00:00"} {"global_step": 237538, "acc_step": 0, "speed/wps": 5519.039451596066, "speed/FLOPS": 243913294755798.56, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.21 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.21, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048027317970991135, "optim/lr": 5.189590313237735e-06, "optim/total_tokens": 1992613167104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2705622911453247, "created_at": "2025-06-03T10:00:41.486283+00:00"} {"global_step": 237539, "acc_step": 0, "speed/wps": 5528.403274968399, "speed/FLOPS": 244327127820462.84, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04630814865231514, "optim/lr": 5.186043088143189e-06, "optim/total_tokens": 1992621555712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2572895288467407, "created_at": "2025-06-03T10:00:44.460906+00:00"} {"global_step": 237540, "acc_step": 0, "speed/wps": 5521.669391746163, "speed/FLOPS": 244029524649178.84, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046869050711393356, "optim/lr": 5.1824958630486416e-06, "optim/total_tokens": 1992629944320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.260766625404358, "created_at": "2025-06-03T10:00:47.433659+00:00"} {"global_step": 237541, "acc_step": 0, "speed/wps": 5522.6956567909265, "speed/FLOPS": 244074880311256.72, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047020815312862396, "optim/lr": 5.178948637954317e-06, "optim/total_tokens": 1992638332928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2630888223648071, "created_at": "2025-06-03T10:00:50.408779+00:00"} {"global_step": 237542, "acc_step": 0, "speed/wps": 5523.147697257174, "speed/FLOPS": 244094858186111.97, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046984463930130005, "optim/lr": 5.175401412859771e-06, "optim/total_tokens": 1992646721536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2686043977737427, "created_at": "2025-06-03T10:00:53.384132+00:00"} {"global_step": 237543, "acc_step": 0, "speed/wps": 5518.581062635349, "speed/FLOPS": 243893036309982.22, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04889702424407005, "optim/lr": 5.1718541877652235e-06, "optim/total_tokens": 1992655110144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2714300155639648, "created_at": "2025-06-03T10:00:56.357218+00:00"} {"global_step": 237544, "acc_step": 0, "speed/wps": 5515.781378206234, "speed/FLOPS": 243769304588299.3, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04699978604912758, "optim/lr": 5.168306962670677e-06, "optim/total_tokens": 1992663498752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2607100009918213, "created_at": "2025-06-03T10:00:59.332238+00:00"} {"global_step": 237545, "acc_step": 0, "speed/wps": 5518.235060929079, "speed/FLOPS": 243877744805562.38, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04676227271556854, "optim/lr": 5.164759737576353e-06, "optim/total_tokens": 1992671887360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2548295259475708, "created_at": "2025-06-03T10:01:02.310093+00:00"} {"global_step": 237546, "acc_step": 0, "speed/wps": 5533.110726872213, "speed/FLOPS": 244535173099688.28, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04807932302355766, "optim/lr": 5.161212512481805e-06, "optim/total_tokens": 1992680275968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2607792615890503, "created_at": "2025-06-03T10:01:05.277032+00:00"} {"global_step": 237547, "acc_step": 0, "speed/wps": 5527.314880725577, "speed/FLOPS": 244279026365836.8, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04682915657758713, "optim/lr": 5.157665287387259e-06, "optim/total_tokens": 1992688664576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2578191757202148, "created_at": "2025-06-03T10:01:08.250391+00:00"} {"global_step": 237548, "acc_step": 0, "speed/wps": 5517.197967534719, "speed/FLOPS": 243831910585856.9, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.2 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.2, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046687960624694824, "optim/lr": 5.154118062292712e-06, "optim/total_tokens": 1992697053184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2645002603530884, "created_at": "2025-06-03T10:01:11.227052+00:00"} {"global_step": 237549, "acc_step": 0, "speed/wps": 5527.695701135848, "speed/FLOPS": 244295856678755.28, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047467462718486786, "optim/lr": 5.150570837198387e-06, "optim/total_tokens": 1992705441792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2509177923202515, "created_at": "2025-06-03T10:01:14.201312+00:00"} {"global_step": 237550, "acc_step": 0, "speed/wps": 5530.3299995417965, "speed/FLOPS": 244412279184736.62, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049501899629831314, "optim/lr": 5.147023612103841e-06, "optim/total_tokens": 1992713830400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2477974891662598, "created_at": "2025-06-03T10:01:17.173083+00:00"} {"global_step": 237551, "acc_step": 0, "speed/wps": 5523.823024920841, "speed/FLOPS": 244124704212205.75, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04694607853889465, "optim/lr": 5.143476387009294e-06, "optim/total_tokens": 1992722219008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2852672338485718, "created_at": "2025-06-03T10:01:20.143696+00:00"} {"global_step": 237552, "acc_step": 0, "speed/wps": 5524.283091805443, "speed/FLOPS": 244145036813669.38, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047098103910684586, "optim/lr": 5.139929161914969e-06, "optim/total_tokens": 1992730607616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2679188251495361, "created_at": "2025-06-03T10:01:23.113460+00:00"} {"global_step": 237553, "acc_step": 0, "speed/wps": 5520.522065416709, "speed/FLOPS": 243978818697965.5, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048600830137729645, "optim/lr": 5.136381936820422e-06, "optim/total_tokens": 1992738996224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2564400434494019, "created_at": "2025-06-03T10:01:26.085737+00:00"} {"global_step": 237554, "acc_step": 0, "speed/wps": 5540.295967254994, "speed/FLOPS": 244852723947213.0, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.08, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04739658161997795, "optim/lr": 5.1328347117258755e-06, "optim/total_tokens": 1992747384832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2496895790100098, "created_at": "2025-06-03T10:01:29.047299+00:00"} {"global_step": 237555, "acc_step": 0, "speed/wps": 5528.706997202355, "speed/FLOPS": 244340550788612.34, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04675139859318733, "optim/lr": 5.129287486631329e-06, "optim/total_tokens": 1992755773440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2732771635055542, "created_at": "2025-06-03T10:01:32.014793+00:00"} {"global_step": 237556, "acc_step": 0, "speed/wps": 5528.457888137282, "speed/FLOPS": 244329541442991.9, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049551937729120255, "optim/lr": 5.125740261537004e-06, "optim/total_tokens": 1992764162048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.250658631324768, "created_at": "2025-06-03T10:01:34.983962+00:00"} {"global_step": 237557, "acc_step": 0, "speed/wps": 5520.578652542227, "speed/FLOPS": 243981319559274.25, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04728221148252487, "optim/lr": 5.122193036442457e-06, "optim/total_tokens": 1992772550656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2679457664489746, "created_at": "2025-06-03T10:01:37.959772+00:00"} {"global_step": 237558, "acc_step": 0, "speed/wps": 5524.348637210921, "speed/FLOPS": 244147933585099.7, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0468071848154068, "optim/lr": 5.118645811347911e-06, "optim/total_tokens": 1992780939264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2441699504852295, "created_at": "2025-06-03T10:01:40.929554+00:00"} {"global_step": 237559, "acc_step": 0, "speed/wps": 5524.436515208002, "speed/FLOPS": 244151817342770.3, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047807373106479645, "optim/lr": 5.115098586253364e-06, "optim/total_tokens": 1992789327872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.261046051979065, "created_at": "2025-06-03T10:01:43.904913+00:00"} {"global_step": 237560, "acc_step": 0, "speed/wps": 5519.162222872879, "speed/FLOPS": 243918720617833.34, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048489511013031006, "optim/lr": 5.111551361159039e-06, "optim/total_tokens": 1992797716480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2711228132247925, "created_at": "2025-06-03T10:01:46.877480+00:00"} {"global_step": 237561, "acc_step": 0, "speed/wps": 5521.6984328463395, "speed/FLOPS": 244030808117160.8, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.19 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.19, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04657164216041565, "optim/lr": 5.108004136064492e-06, "optim/total_tokens": 1992806105088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2589409351348877, "created_at": "2025-06-03T10:01:49.849267+00:00"} {"global_step": 237562, "acc_step": 0, "speed/wps": 5527.365462859891, "speed/FLOPS": 244281261837270.7, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046998683363199234, "optim/lr": 5.104456910969946e-06, "optim/total_tokens": 1992814493696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.268202781677246, "created_at": "2025-06-03T10:01:52.817956+00:00"} {"global_step": 237563, "acc_step": 0, "speed/wps": 5530.057044186205, "speed/FLOPS": 244400215955131.62, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04871363192796707, "optim/lr": 5.100909685875399e-06, "optim/total_tokens": 1992822882304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2621105909347534, "created_at": "2025-06-03T10:01:55.787393+00:00"} {"global_step": 237564, "acc_step": 0, "speed/wps": 5535.48137189916, "speed/FLOPS": 244639943475818.12, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04703088104724884, "optim/lr": 5.097362460781074e-06, "optim/total_tokens": 1992831270912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2649726867675781, "created_at": "2025-06-03T10:01:58.754812+00:00"} {"global_step": 237565, "acc_step": 0, "speed/wps": 5512.136594250271, "speed/FLOPS": 243608223793141.22, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04749284312129021, "optim/lr": 5.0938152356865275e-06, "optim/total_tokens": 1992839659520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2438608407974243, "created_at": "2025-06-03T10:02:01.733436+00:00"} {"global_step": 237566, "acc_step": 0, "speed/wps": 5523.899199614836, "speed/FLOPS": 244128070743782.9, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04815680906176567, "optim/lr": 5.090268010591981e-06, "optim/total_tokens": 1992848048128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.276613712310791, "created_at": "2025-06-03T10:02:04.707546+00:00"} {"global_step": 237567, "acc_step": 0, "speed/wps": 5527.6389415276635, "speed/FLOPS": 244293348194595.53, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04722967743873596, "optim/lr": 5.086720785497434e-06, "optim/total_tokens": 1992856436736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2631667852401733, "created_at": "2025-06-03T10:02:07.675596+00:00"} {"global_step": 237568, "acc_step": 0, "speed/wps": 5534.393685271615, "speed/FLOPS": 244591873294165.5, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.29, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.052773281931877136, "optim/lr": 5.0831735604031094e-06, "optim/total_tokens": 1992864825344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2606968879699707, "created_at": "2025-06-03T10:02:10.640270+00:00"} {"global_step": 237569, "acc_step": 0, "speed/wps": 5518.242709072871, "speed/FLOPS": 243878082814371.22, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04651418700814247, "optim/lr": 5.079626335308562e-06, "optim/total_tokens": 1992873213952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2637525796890259, "created_at": "2025-06-03T10:02:13.613692+00:00"} {"global_step": 237570, "acc_step": 0, "speed/wps": 5521.177417541859, "speed/FLOPS": 244007781907500.84, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04712370038032532, "optim/lr": 5.076079110214016e-06, "optim/total_tokens": 1992881602560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2627166509628296, "created_at": "2025-06-03T10:02:16.585047+00:00"} {"global_step": 237571, "acc_step": 0, "speed/wps": 5519.612251137941, "speed/FLOPS": 243938609563695.56, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0467272624373436, "optim/lr": 5.072531885119469e-06, "optim/total_tokens": 1992889991168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.259365439414978, "created_at": "2025-06-03T10:02:19.557600+00:00"} {"global_step": 237572, "acc_step": 0, "speed/wps": 5534.383515605438, "speed/FLOPS": 244591423846973.56, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04838979244232178, "optim/lr": 5.068984660025144e-06, "optim/total_tokens": 1992898379776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2759757041931152, "created_at": "2025-06-03T10:02:22.522247+00:00"} {"global_step": 237573, "acc_step": 0, "speed/wps": 5524.07142765265, "speed/FLOPS": 244135682341511.25, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04701812565326691, "optim/lr": 5.065437434930598e-06, "optim/total_tokens": 1992906768384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2726207971572876, "created_at": "2025-06-03T10:02:25.492719+00:00"} {"global_step": 237574, "acc_step": 0, "speed/wps": 5520.489753452747, "speed/FLOPS": 243977390674546.0, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04625197499990463, "optim/lr": 5.0618902098360505e-06, "optim/total_tokens": 1992915156992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2755534648895264, "created_at": "2025-06-03T10:02:28.467525+00:00"} {"global_step": 237575, "acc_step": 0, "speed/wps": 5525.793219739514, "speed/FLOPS": 244211776738819.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0475236177444458, "optim/lr": 5.058342984741504e-06, "optim/total_tokens": 1992923545600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2686611413955688, "created_at": "2025-06-03T10:02:31.438682+00:00"} {"global_step": 237576, "acc_step": 0, "speed/wps": 5513.024339027962, "speed/FLOPS": 243647457568425.47, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.18 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.18, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05271771922707558, "optim/lr": 5.05479575964718e-06, "optim/total_tokens": 1992931934208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2669963836669922, "created_at": "2025-06-03T10:02:34.419904+00:00"} {"global_step": 237577, "acc_step": 0, "speed/wps": 5520.21870956691, "speed/FLOPS": 243965411922120.38, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04987137019634247, "optim/lr": 5.051248534552632e-06, "optim/total_tokens": 1992940322816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.26323664188385, "created_at": "2025-06-03T10:02:37.392462+00:00"} {"global_step": 237578, "acc_step": 0, "speed/wps": 5520.391895221621, "speed/FLOPS": 243973065841614.06, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04682924225926399, "optim/lr": 5.047701309458086e-06, "optim/total_tokens": 1992948711424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.262444257736206, "created_at": "2025-06-03T10:02:40.365682+00:00"} {"global_step": 237579, "acc_step": 0, "speed/wps": 5535.31661661727, "speed/FLOPS": 244632662135652.56, "speed/curr_iter_time": 2.9589, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9589, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.27, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05303234979510307, "optim/lr": 5.0441540843637615e-06, "optim/total_tokens": 1992957100032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2517271041870117, "created_at": "2025-06-03T10:02:43.335842+00:00"} {"global_step": 237580, "acc_step": 0, "speed/wps": 5524.235979525881, "speed/FLOPS": 244142954692055.22, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04998502507805824, "optim/lr": 5.040606859269214e-06, "optim/total_tokens": 1992965488640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2640401124954224, "created_at": "2025-06-03T10:02:46.306430+00:00"} {"global_step": 237581, "acc_step": 0, "speed/wps": 5522.727719349409, "speed/FLOPS": 244076297312230.6, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0477287620306015, "optim/lr": 5.037059634174668e-06, "optim/total_tokens": 1992973877248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2611371278762817, "created_at": "2025-06-03T10:02:49.279019+00:00"} {"global_step": 237582, "acc_step": 0, "speed/wps": 5538.536981301545, "speed/FLOPS": 244774985771376.8, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.16, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047583866864442825, "optim/lr": 5.033512409080121e-06, "optim/total_tokens": 1992982265856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2579277753829956, "created_at": "2025-06-03T10:02:52.242279+00:00"} {"global_step": 237583, "acc_step": 0, "speed/wps": 5519.969970782276, "speed/FLOPS": 243954418941000.06, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04767121747136116, "optim/lr": 5.029965183985796e-06, "optim/total_tokens": 1992990654464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2676634788513184, "created_at": "2025-06-03T10:02:55.218780+00:00"} {"global_step": 237584, "acc_step": 0, "speed/wps": 5514.7174493427565, "speed/FLOPS": 243722284378215.22, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049435507506132126, "optim/lr": 5.02641795889125e-06, "optim/total_tokens": 1992999043072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2702901363372803, "created_at": "2025-06-03T10:02:58.196853+00:00"} {"global_step": 237585, "acc_step": 0, "speed/wps": 5513.861096044549, "speed/FLOPS": 243684437945647.97, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04663737863302231, "optim/lr": 5.0228707337967025e-06, "optim/total_tokens": 1993007431680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2606128454208374, "created_at": "2025-06-03T10:03:01.172435+00:00"} {"global_step": 237586, "acc_step": 0, "speed/wps": 5516.650394004294, "speed/FLOPS": 243807710638547.5, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.17 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.17, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049388352781534195, "optim/lr": 5.019323508702156e-06, "optim/total_tokens": 1993015820288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2575384378433228, "created_at": "2025-06-03T10:03:04.146359+00:00"} {"global_step": 237587, "acc_step": 0, "speed/wps": 5516.77052367446, "speed/FLOPS": 243813019755089.44, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04851711541414261, "optim/lr": 5.015776283607832e-06, "optim/total_tokens": 1993024208896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2596747875213623, "created_at": "2025-06-03T10:03:07.120529+00:00"} {"global_step": 237588, "acc_step": 0, "speed/wps": 5529.555215990854, "speed/FLOPS": 244378037717486.7, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04788447171449661, "optim/lr": 5.012229058513284e-06, "optim/total_tokens": 1993032597504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.259380578994751, "created_at": "2025-06-03T10:03:10.087692+00:00"} {"global_step": 237589, "acc_step": 0, "speed/wps": 5527.710027782492, "speed/FLOPS": 244296489843206.5, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047715555876493454, "optim/lr": 5.008681833418738e-06, "optim/total_tokens": 1993040986112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2608275413513184, "created_at": "2025-06-03T10:03:13.059275+00:00"} {"global_step": 237590, "acc_step": 0, "speed/wps": 5539.950092779834, "speed/FLOPS": 244837438065757.0, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.03, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04934432730078697, "optim/lr": 5.005134608324191e-06, "optim/total_tokens": 1993049374720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2525458335876465, "created_at": "2025-06-03T10:03:16.021070+00:00"} {"global_step": 237591, "acc_step": 0, "speed/wps": 5524.226145089604, "speed/FLOPS": 244142520060309.0, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049683503806591034, "optim/lr": 5.001587383229866e-06, "optim/total_tokens": 1993057763328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2651034593582153, "created_at": "2025-06-03T10:03:18.992432+00:00"} {"global_step": 237592, "acc_step": 0, "speed/wps": 5518.967346329395, "speed/FLOPS": 243910108072079.88, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046495817601680756, "optim/lr": 4.99804015813532e-06, "optim/total_tokens": 1993066151936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2503212690353394, "created_at": "2025-06-03T10:03:21.969598+00:00"} {"global_step": 237593, "acc_step": 0, "speed/wps": 5522.444820310789, "speed/FLOPS": 244063794622732.1, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04797294735908508, "optim/lr": 4.994492933040773e-06, "optim/total_tokens": 1993074540544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2584636211395264, "created_at": "2025-06-03T10:03:24.940671+00:00"} {"global_step": 237594, "acc_step": 0, "speed/wps": 5523.645768934379, "speed/FLOPS": 244116870404882.5, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04983464255928993, "optim/lr": 4.990945707946226e-06, "optim/total_tokens": 1993082929152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2671737670898438, "created_at": "2025-06-03T10:03:27.916430+00:00"} {"global_step": 237595, "acc_step": 0, "speed/wps": 5500.929100067079, "speed/FLOPS": 243112909915399.66, "speed/curr_iter_time": 2.9775, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9775, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048238955438137054, "optim/lr": 4.987398482851902e-06, "optim/total_tokens": 1993091317760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.281054139137268, "created_at": "2025-06-03T10:03:30.902907+00:00"} {"global_step": 237596, "acc_step": 0, "speed/wps": 5514.119228632023, "speed/FLOPS": 243695846084771.94, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.16 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.16, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046660955995321274, "optim/lr": 4.9838512577573545e-06, "optim/total_tokens": 1993099706368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2700951099395752, "created_at": "2025-06-03T10:03:33.878232+00:00"} {"global_step": 237597, "acc_step": 0, "speed/wps": 5529.99367391257, "speed/FLOPS": 244397415313395.44, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.15 hours", "speed/est_time_elapsed_hrs": 195.4, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.15, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049555618315935135, "optim/lr": 4.980304032662808e-06, "optim/total_tokens": 1993108094976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2671332359313965, "created_at": "2025-06-03T10:03:36.846582+00:00"} {"global_step": 237598, "acc_step": 0, "speed/wps": 5534.878601127927, "speed/FLOPS": 244613304092990.12, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.15 hours", "speed/est_time_elapsed_hrs": 195.31, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.15, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049622900784015656, "optim/lr": 4.976756807568261e-06, "optim/total_tokens": 1993116483584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.270182728767395, "created_at": "2025-06-03T10:03:39.814275+00:00"} {"global_step": 237599, "acc_step": 0, "speed/wps": 5530.999264773005, "speed/FLOPS": 244441857282346.06, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.15 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.15, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05055076628923416, "optim/lr": 4.9732095824739364e-06, "optim/total_tokens": 1993124872192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2561862468719482, "created_at": "2025-06-03T10:03:42.784258+00:00"} {"global_step": 237600, "acc_step": 0, "speed/wps": 5527.308102646645, "speed/FLOPS": 244278726809441.4, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.15 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.15, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046780023723840714, "optim/lr": 4.96966235737939e-06, "optim/total_tokens": 1993133260800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2520649433135986, "created_at": "2025-06-03T10:03:45.753244+00:00"} {"global_step": 237601, "acc_step": 0, "speed/wps": 244.93541778473056, "speed/FLOPS": 10824891772966.834, "speed/curr_iter_time": 2.8851, "speed/data_load_time": 0.0017, "speed/curr_step_time": 2.8851, "speed/est_time_elapsed": "7.93 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 190.42, "speed/est_time_elapsed_days": 7.93, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05144394934177399, "optim/lr": 4.966115132284843e-06, "optim/total_tokens": 1993141649408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.267529010772705, "created_at": "2025-06-03T10:04:52.651192+00:00"} {"global_step": 237602, "acc_step": 0, "speed/wps": 5612.440157769467, "speed/FLOPS": 248041127900510.75, "speed/curr_iter_time": 2.9166, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9166, "speed/est_time_elapsed": "8.02 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 192.5, "speed/est_time_elapsed_days": 8.02, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04975896328687668, "optim/lr": 4.962567907190296e-06, "optim/total_tokens": 1993150038016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2548127174377441, "created_at": "2025-06-03T10:04:55.578376+00:00"} {"global_step": 237603, "acc_step": 0, "speed/wps": 5582.417644860108, "speed/FLOPS": 246714286499068.6, "speed/curr_iter_time": 2.9338, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9338, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 193.63, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0465860441327095, "optim/lr": 4.959020682095972e-06, "optim/total_tokens": 1993158426624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.258837342262268, "created_at": "2025-06-03T10:04:58.522392+00:00"} {"global_step": 237604, "acc_step": 0, "speed/wps": 5558.020864334868, "speed/FLOPS": 245636073673895.8, "speed/curr_iter_time": 2.9467, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9467, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049088284373283386, "optim/lr": 4.955473457001425e-06, "optim/total_tokens": 1993166815232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2682225704193115, "created_at": "2025-06-03T10:05:01.479712+00:00"} {"global_step": 237605, "acc_step": 0, "speed/wps": 5515.646282882142, "speed/FLOPS": 243763334066455.03, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.15 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.15, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04707040265202522, "optim/lr": 4.951926231906878e-06, "optim/total_tokens": 1993175203840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2595134973526, "created_at": "2025-06-03T10:05:04.459727+00:00"} {"global_step": 237606, "acc_step": 0, "speed/wps": 5546.720339329804, "speed/FLOPS": 245136648310002.4, "speed/curr_iter_time": 2.9512, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9512, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 194.78, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04781854897737503, "optim/lr": 4.948379006812553e-06, "optim/total_tokens": 1993183592448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2642992734909058, "created_at": "2025-06-03T10:05:07.421868+00:00"} {"global_step": 237607, "acc_step": 0, "speed/wps": 5525.255300957012, "speed/FLOPS": 244188003481951.16, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.15 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.15, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046934545040130615, "optim/lr": 4.944831781718007e-06, "optim/total_tokens": 1993191981056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2534029483795166, "created_at": "2025-06-03T10:05:10.391226+00:00"} {"global_step": 237608, "acc_step": 0, "speed/wps": 5546.581018453844, "speed/FLOPS": 245130491040393.88, "speed/curr_iter_time": 2.9529, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9529, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 194.9, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04672830551862717, "optim/lr": 4.94128455662346e-06, "optim/total_tokens": 1993200369664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2741245031356812, "created_at": "2025-06-03T10:05:13.349433+00:00"} {"global_step": 237609, "acc_step": 0, "speed/wps": 5553.936288463814, "speed/FLOPS": 245455556327149.78, "speed/curr_iter_time": 2.9475, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9475, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 194.54, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047596681863069534, "optim/lr": 4.937737331528913e-06, "optim/total_tokens": 1993208758272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.265505313873291, "created_at": "2025-06-03T10:05:16.307525+00:00"} {"global_step": 237610, "acc_step": 0, "speed/wps": 5537.191427483159, "speed/FLOPS": 244715519179772.94, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04701213166117668, "optim/lr": 4.9341901064345885e-06, "optim/total_tokens": 1993217146880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2611693143844604, "created_at": "2025-06-03T10:05:19.271077+00:00"} {"global_step": 237611, "acc_step": 0, "speed/wps": 5522.20967763266, "speed/FLOPS": 244053402519928.16, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046758878976106644, "optim/lr": 4.930642881340042e-06, "optim/total_tokens": 1993225535488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2663445472717285, "created_at": "2025-06-03T10:05:22.246431+00:00"} {"global_step": 237612, "acc_step": 0, "speed/wps": 5538.335310364175, "speed/FLOPS": 244766072948190.5, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04719054698944092, "optim/lr": 4.927095656245495e-06, "optim/total_tokens": 1993233924096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2664361000061035, "created_at": "2025-06-03T10:05:25.212027+00:00"} {"global_step": 237613, "acc_step": 0, "speed/wps": 5527.859129794175, "speed/FLOPS": 244303079388949.6, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0464005284011364, "optim/lr": 4.9235484311509485e-06, "optim/total_tokens": 1993242312704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2651313543319702, "created_at": "2025-06-03T10:05:28.184306+00:00"} {"global_step": 237614, "acc_step": 0, "speed/wps": 5537.427832116118, "speed/FLOPS": 244725967054521.16, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04679994285106659, "optim/lr": 4.920001206056623e-06, "optim/total_tokens": 1993250701312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.256390929222107, "created_at": "2025-06-03T10:05:31.151902+00:00"} {"global_step": 237615, "acc_step": 0, "speed/wps": 5522.559733240332, "speed/FLOPS": 244068873186040.25, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04773564636707306, "optim/lr": 4.916453980962077e-06, "optim/total_tokens": 1993259089920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2781329154968262, "created_at": "2025-06-03T10:05:34.128438+00:00"} {"global_step": 237616, "acc_step": 0, "speed/wps": 5521.604141697656, "speed/FLOPS": 244026640931014.88, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046085141599178314, "optim/lr": 4.91290675586753e-06, "optim/total_tokens": 1993267478528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2613061666488647, "created_at": "2025-06-03T10:05:37.103712+00:00"} {"global_step": 237617, "acc_step": 0, "speed/wps": 5530.5464015818925, "speed/FLOPS": 244421843047262.8, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047120895236730576, "optim/lr": 4.909359530772983e-06, "optim/total_tokens": 1993275867136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 359, "loss/out": 1.2680010795593262, "created_at": "2025-06-03T10:05:40.070809+00:00"} {"global_step": 237618, "acc_step": 0, "speed/wps": 5548.017791532242, "speed/FLOPS": 245193989056387.78, "speed/curr_iter_time": 2.9522, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9522, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 194.86, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04978047311306, "optim/lr": 4.905812305678659e-06, "optim/total_tokens": 1993284255744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2825381755828857, "created_at": "2025-06-03T10:05:43.032051+00:00"} {"global_step": 237619, "acc_step": 0, "speed/wps": 5530.857129163808, "speed/FLOPS": 244435575615935.56, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.14 hours", "speed/est_time_elapsed_hrs": 195.37, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.14, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04768668860197067, "optim/lr": 4.902265080584111e-06, "optim/total_tokens": 1993292644352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2496683597564697, "created_at": "2025-06-03T10:05:45.998716+00:00"} {"global_step": 237620, "acc_step": 0, "speed/wps": 5538.817960481157, "speed/FLOPS": 244787403612933.84, "speed/curr_iter_time": 2.9571, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9571, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.19, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04631825536489487, "optim/lr": 4.898717855489565e-06, "optim/total_tokens": 1993301032960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2626383304595947, "created_at": "2025-06-03T10:05:48.966665+00:00"} {"global_step": 237621, "acc_step": 0, "speed/wps": 5542.150345943516, "speed/FLOPS": 244934677993675.12, "speed/curr_iter_time": 2.9553, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9553, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.07, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048622798174619675, "optim/lr": 4.895170630395019e-06, "optim/total_tokens": 1993309421568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.26980459690094, "created_at": "2025-06-03T10:05:51.929270+00:00"} {"global_step": 237622, "acc_step": 0, "speed/wps": 5534.933235209662, "speed/FLOPS": 244615718639760.22, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.33, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047088801860809326, "optim/lr": 4.891623405300693e-06, "optim/total_tokens": 1993317810176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.25533926486969, "created_at": "2025-06-03T10:05:54.894007+00:00"} {"global_step": 237623, "acc_step": 0, "speed/wps": 5541.022151262157, "speed/FLOPS": 244884817563382.9, "speed/curr_iter_time": 2.9546, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9546, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.02, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046277038753032684, "optim/lr": 4.888076180206147e-06, "optim/total_tokens": 1993326198784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2729288339614868, "created_at": "2025-06-03T10:05:57.857474+00:00"} {"global_step": 237624, "acc_step": 0, "speed/wps": 5528.712545946451, "speed/FLOPS": 244340796014700.38, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048701368272304535, "optim/lr": 4.8845289551116005e-06, "optim/total_tokens": 1993334587392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2776868343353271, "created_at": "2025-06-03T10:06:00.828973+00:00"} {"global_step": 237625, "acc_step": 0, "speed/wps": 5523.242215839803, "speed/FLOPS": 244099035423674.25, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04711717739701271, "optim/lr": 4.880981730017053e-06, "optim/total_tokens": 1993342976000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2621259689331055, "created_at": "2025-06-03T10:06:03.802104+00:00"} {"global_step": 237626, "acc_step": 0, "speed/wps": 5532.26078895747, "speed/FLOPS": 244497610194233.28, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046535395085811615, "optim/lr": 4.877434504922729e-06, "optim/total_tokens": 1993351364608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2549892663955688, "created_at": "2025-06-03T10:06:06.772683+00:00"} {"global_step": 237627, "acc_step": 0, "speed/wps": 5537.8306481451955, "speed/FLOPS": 244743769461207.0, "speed/curr_iter_time": 2.9576, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9576, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04685499146580696, "optim/lr": 4.8738872798281815e-06, "optim/total_tokens": 1993359753216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2559375762939453, "created_at": "2025-06-03T10:06:09.736267+00:00"} {"global_step": 237628, "acc_step": 0, "speed/wps": 5532.456235717996, "speed/FLOPS": 244506247940661.3, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04716214910149574, "optim/lr": 4.870340054733635e-06, "optim/total_tokens": 1993368141824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2604697942733765, "created_at": "2025-06-03T10:06:12.702168+00:00"} {"global_step": 237629, "acc_step": 0, "speed/wps": 5516.183823158545, "speed/FLOPS": 243787090595291.47, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04642089456319809, "optim/lr": 4.866792829639089e-06, "optim/total_tokens": 1993376530432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.264689326286316, "created_at": "2025-06-03T10:06:15.676619+00:00"} {"global_step": 237630, "acc_step": 0, "speed/wps": 5531.076916989649, "speed/FLOPS": 244445289112861.66, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04788234084844589, "optim/lr": 4.8632456045447634e-06, "optim/total_tokens": 1993384919040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2557060718536377, "created_at": "2025-06-03T10:06:18.646175+00:00"} {"global_step": 237631, "acc_step": 0, "speed/wps": 5532.172434398089, "speed/FLOPS": 244493705374948.25, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04762500897049904, "optim/lr": 4.859698379450217e-06, "optim/total_tokens": 1993393307648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2598241567611694, "created_at": "2025-06-03T10:06:21.615151+00:00"} {"global_step": 237632, "acc_step": 0, "speed/wps": 5511.774519812768, "speed/FLOPS": 243592221956268.56, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04625339061021805, "optim/lr": 4.856151154355671e-06, "optim/total_tokens": 1993401696256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2646934986114502, "created_at": "2025-06-03T10:06:24.592686+00:00"} {"global_step": 237633, "acc_step": 0, "speed/wps": 5523.650256951448, "speed/FLOPS": 244117068752265.2, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.13 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.13, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048018522560596466, "optim/lr": 4.852603929261345e-06, "optim/total_tokens": 1993410084864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.268937587738037, "created_at": "2025-06-03T10:06:27.563460+00:00"} {"global_step": 237634, "acc_step": 0, "speed/wps": 5538.072538055232, "speed/FLOPS": 244754459757125.84, "speed/curr_iter_time": 2.9575, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9575, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0461956150829792, "optim/lr": 4.849056704166799e-06, "optim/total_tokens": 1993418473472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2757456302642822, "created_at": "2025-06-03T10:06:30.525952+00:00"} {"global_step": 237635, "acc_step": 0, "speed/wps": 5525.063081724832, "speed/FLOPS": 244179508375756.03, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04679407179355621, "optim/lr": 4.845509479072252e-06, "optim/total_tokens": 1993426862080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2633931636810303, "created_at": "2025-06-03T10:06:33.499985+00:00"} {"global_step": 237636, "acc_step": 0, "speed/wps": 5535.333934066517, "speed/FLOPS": 244633427478270.56, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0484653115272522, "optim/lr": 4.841962253977705e-06, "optim/total_tokens": 1993435250688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2408795356750488, "created_at": "2025-06-03T10:06:36.466494+00:00"} {"global_step": 237637, "acc_step": 0, "speed/wps": 5531.171122398898, "speed/FLOPS": 244449452509763.44, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04736677557229996, "optim/lr": 4.838415028883381e-06, "optim/total_tokens": 1993443639296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2714958190917969, "created_at": "2025-06-03T10:06:39.432799+00:00"} {"global_step": 237638, "acc_step": 0, "speed/wps": 5520.486172689544, "speed/FLOPS": 243977232423140.44, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048446036875247955, "optim/lr": 4.834867803788834e-06, "optim/total_tokens": 1993452027904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2562172412872314, "created_at": "2025-06-03T10:06:42.408141+00:00"} {"global_step": 237639, "acc_step": 0, "speed/wps": 5528.516318994604, "speed/FLOPS": 244332123787809.3, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046609457582235336, "optim/lr": 4.831320578694287e-06, "optim/total_tokens": 1993460416512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2559494972229004, "created_at": "2025-06-03T10:06:45.375958+00:00"} {"global_step": 237640, "acc_step": 0, "speed/wps": 5524.270066177666, "speed/FLOPS": 244144461147592.84, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047024521976709366, "optim/lr": 4.82777335359974e-06, "optim/total_tokens": 1993468805120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2609177827835083, "created_at": "2025-06-03T10:06:48.346233+00:00"} {"global_step": 237641, "acc_step": 0, "speed/wps": 5525.217340194115, "speed/FLOPS": 244186325810531.94, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04688311368227005, "optim/lr": 4.8242261285054155e-06, "optim/total_tokens": 1993477193728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2675126791000366, "created_at": "2025-06-03T10:06:51.320726+00:00"} {"global_step": 237642, "acc_step": 0, "speed/wps": 5521.294137083456, "speed/FLOPS": 244012940313814.7, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05189736932516098, "optim/lr": 4.820678903410869e-06, "optim/total_tokens": 1993485582336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2611947059631348, "created_at": "2025-06-03T10:06:54.294694+00:00"} {"global_step": 237643, "acc_step": 0, "speed/wps": 5529.969726500104, "speed/FLOPS": 244396356960338.4, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.42, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04734502360224724, "optim/lr": 4.817131678316322e-06, "optim/total_tokens": 1993493970944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.276424527168274, "created_at": "2025-06-03T10:06:57.262400+00:00"} {"global_step": 237644, "acc_step": 0, "speed/wps": 5526.716981961191, "speed/FLOPS": 244252602300774.28, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046984247863292694, "optim/lr": 4.8135844532217755e-06, "optim/total_tokens": 1993502359552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.262824535369873, "created_at": "2025-06-03T10:07:00.230959+00:00"} {"global_step": 237645, "acc_step": 0, "speed/wps": 5521.440798040024, "speed/FLOPS": 244019421977416.16, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04705221205949783, "optim/lr": 4.810037228127451e-06, "optim/total_tokens": 1993510748160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2624691724777222, "created_at": "2025-06-03T10:07:03.204439+00:00"} {"global_step": 237646, "acc_step": 0, "speed/wps": 5527.506056576245, "speed/FLOPS": 244287475359909.66, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047144901007413864, "optim/lr": 4.806490003032904e-06, "optim/total_tokens": 1993519136768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2577836513519287, "created_at": "2025-06-03T10:07:06.178266+00:00"} {"global_step": 237647, "acc_step": 0, "speed/wps": 5508.765300980746, "speed/FLOPS": 243459229886471.47, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.12 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.12, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04812205955386162, "optim/lr": 4.802942777938357e-06, "optim/total_tokens": 1993527525376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2454301118850708, "created_at": "2025-06-03T10:07:09.158946+00:00"} {"global_step": 237648, "acc_step": 0, "speed/wps": 5521.147090581, "speed/FLOPS": 244006441611058.38, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04752812907099724, "optim/lr": 4.79939555284381e-06, "optim/total_tokens": 1993535913984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2509028911590576, "created_at": "2025-06-03T10:07:12.130434+00:00"} {"global_step": 237649, "acc_step": 0, "speed/wps": 5521.531997562716, "speed/FLOPS": 244023452529517.7, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04690305143594742, "optim/lr": 4.795848327749486e-06, "optim/total_tokens": 1993544302592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2714385986328125, "created_at": "2025-06-03T10:07:15.101597+00:00"} {"global_step": 237650, "acc_step": 0, "speed/wps": 5523.433537542583, "speed/FLOPS": 244107490863663.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047278281301259995, "optim/lr": 4.792301102654939e-06, "optim/total_tokens": 1993552691200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2588772773742676, "created_at": "2025-06-03T10:07:18.072368+00:00"} {"global_step": 237651, "acc_step": 0, "speed/wps": 5532.561512751441, "speed/FLOPS": 244510900646682.9, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04718964174389839, "optim/lr": 4.788753877560392e-06, "optim/total_tokens": 1993561079808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2672897577285767, "created_at": "2025-06-03T10:07:21.042746+00:00"} {"global_step": 237652, "acc_step": 0, "speed/wps": 5522.902088052555, "speed/FLOPS": 244084003516409.72, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04671832174062729, "optim/lr": 4.785206652465846e-06, "optim/total_tokens": 1993569468416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2419534921646118, "created_at": "2025-06-03T10:07:24.014363+00:00"} {"global_step": 237653, "acc_step": 0, "speed/wps": 5531.890570871843, "speed/FLOPS": 244481248449796.5, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0470220223069191, "optim/lr": 4.781659427371521e-06, "optim/total_tokens": 1993577857024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2494187355041504, "created_at": "2025-06-03T10:07:26.983943+00:00"} {"global_step": 237654, "acc_step": 0, "speed/wps": 5532.54344881902, "speed/FLOPS": 244510102313329.47, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048063792288303375, "optim/lr": 4.778112202276974e-06, "optim/total_tokens": 1993586245632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2562450170516968, "created_at": "2025-06-03T10:07:29.949342+00:00"} {"global_step": 237655, "acc_step": 0, "speed/wps": 5520.258822792759, "speed/FLOPS": 243967184721384.8, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05033153295516968, "optim/lr": 4.7745649771824275e-06, "optim/total_tokens": 1993594634240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2857803106307983, "created_at": "2025-06-03T10:07:32.926416+00:00"} {"global_step": 237656, "acc_step": 0, "speed/wps": 5516.834531535771, "speed/FLOPS": 243815848574937.47, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04653051123023033, "optim/lr": 4.77101775208788e-06, "optim/total_tokens": 1993603022848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2614479064941406, "created_at": "2025-06-03T10:07:35.899892+00:00"} {"global_step": 237657, "acc_step": 0, "speed/wps": 5514.236064758577, "speed/FLOPS": 243701009643544.16, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04692452773451805, "optim/lr": 4.767470526993556e-06, "optim/total_tokens": 1993611411456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2728044986724854, "created_at": "2025-06-03T10:07:38.875428+00:00"} {"global_step": 237658, "acc_step": 0, "speed/wps": 5510.176455878438, "speed/FLOPS": 243521595710003.9, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046855080872774124, "optim/lr": 4.763923301899009e-06, "optim/total_tokens": 1993619800064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.242942214012146, "created_at": "2025-06-03T10:07:41.853613+00:00"} {"global_step": 237659, "acc_step": 0, "speed/wps": 5498.806896016777, "speed/FLOPS": 243019119358801.3, "speed/curr_iter_time": 2.9786, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9786, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "1.11 hours", "speed/est_time_elapsed_hrs": 196.64, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 1.11, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04689818248152733, "optim/lr": 4.760376076804462e-06, "optim/total_tokens": 1993628188672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2596172094345093, "created_at": "2025-06-03T10:07:44.842985+00:00"} {"global_step": 237660, "acc_step": 0, "speed/wps": 5515.637184129396, "speed/FLOPS": 243762931948155.28, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04815976321697235, "optim/lr": 4.756828851710138e-06, "optim/total_tokens": 1993636577280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2622261047363281, "created_at": "2025-06-03T10:07:47.820647+00:00"} {"global_step": 237661, "acc_step": 0, "speed/wps": 5531.619280801155, "speed/FLOPS": 244469258817260.56, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04709514230489731, "optim/lr": 4.753281626615591e-06, "optim/total_tokens": 1993644965888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2391468286514282, "created_at": "2025-06-03T10:07:50.787415+00:00"} {"global_step": 237662, "acc_step": 0, "speed/wps": 5519.909614775426, "speed/FLOPS": 243951751514427.34, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04729422926902771, "optim/lr": 4.749734401521044e-06, "optim/total_tokens": 1993653354496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2673999071121216, "created_at": "2025-06-03T10:07:53.759770+00:00"} {"global_step": 237663, "acc_step": 0, "speed/wps": 5521.772670647403, "speed/FLOPS": 244034089047984.3, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05008537322282791, "optim/lr": 4.746187176426498e-06, "optim/total_tokens": 1993661743104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2606775760650635, "created_at": "2025-06-03T10:07:56.733742+00:00"} {"global_step": 237664, "acc_step": 0, "speed/wps": 5513.229930848177, "speed/FLOPS": 243656543674564.66, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046624526381492615, "optim/lr": 4.742639951332172e-06, "optim/total_tokens": 1993670131712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2539937496185303, "created_at": "2025-06-03T10:07:59.713332+00:00"} {"global_step": 237665, "acc_step": 0, "speed/wps": 5519.75745629462, "speed/FLOPS": 243945026888393.44, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04724370315670967, "optim/lr": 4.739092726237626e-06, "optim/total_tokens": 1993678520320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2666648626327515, "created_at": "2025-06-03T10:08:02.692257+00:00"} {"global_step": 237666, "acc_step": 0, "speed/wps": 5504.119118961319, "speed/FLOPS": 243253892422528.2, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04770375415682793, "optim/lr": 4.7355455011430795e-06, "optim/total_tokens": 1993686908928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2588582038879395, "created_at": "2025-06-03T10:08:05.677408+00:00"} {"global_step": 237667, "acc_step": 0, "speed/wps": 5517.976935743022, "speed/FLOPS": 243866336993543.16, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04702039808034897, "optim/lr": 4.731998276048532e-06, "optim/total_tokens": 1993695297536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2596683502197266, "created_at": "2025-06-03T10:08:08.653777+00:00"} {"global_step": 237668, "acc_step": 0, "speed/wps": 5517.822671987917, "speed/FLOPS": 243859519325160.97, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.046696171164512634, "optim/lr": 4.728451050954208e-06, "optim/total_tokens": 1993703686144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2612260580062866, "created_at": "2025-06-03T10:08:11.631241+00:00"} {"global_step": 237669, "acc_step": 0, "speed/wps": 5514.639340889521, "speed/FLOPS": 243718832384377.5, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04696827381849289, "optim/lr": 4.7249038258596614e-06, "optim/total_tokens": 1993712074752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2450405359268188, "created_at": "2025-06-03T10:08:14.607018+00:00"} {"global_step": 237670, "acc_step": 0, "speed/wps": 5510.214971802625, "speed/FLOPS": 243523297916710.6, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04708387330174446, "optim/lr": 4.721356600765114e-06, "optim/total_tokens": 1993720463360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2441725730895996, "created_at": "2025-06-03T10:08:17.584800+00:00"} {"global_step": 237671, "acc_step": 0, "speed/wps": 5517.913954953558, "speed/FLOPS": 243863553565013.72, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04680212214589119, "optim/lr": 4.717809375670568e-06, "optim/total_tokens": 1993728851968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2462942600250244, "created_at": "2025-06-03T10:08:20.562101+00:00"} {"global_step": 237672, "acc_step": 0, "speed/wps": 5507.931528403061, "speed/FLOPS": 243422381406172.7, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.05014742538332939, "optim/lr": 4.7142621505762425e-06, "optim/total_tokens": 1993737240576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2482633590698242, "created_at": "2025-06-03T10:08:23.540910+00:00"} {"global_step": 237673, "acc_step": 0, "speed/wps": 5510.770933328696, "speed/FLOPS": 243547868570493.88, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.048019494861364365, "optim/lr": 4.710714925481696e-06, "optim/total_tokens": 1993745629184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2639496326446533, "created_at": "2025-06-03T10:08:26.518660+00:00"} {"global_step": 237674, "acc_step": 0, "speed/wps": 5506.633625199337, "speed/FLOPS": 243365020727838.94, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.1 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.1, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047224391251802444, "optim/lr": 4.70716770038715e-06, "optim/total_tokens": 1993754017792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2543435096740723, "created_at": "2025-06-03T10:08:29.500832+00:00"} {"global_step": 237675, "acc_step": 0, "speed/wps": 5509.489794723107, "speed/FLOPS": 243491248801588.66, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04775867611169815, "optim/lr": 4.7036204752926025e-06, "optim/total_tokens": 1993762406400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.270599603652954, "created_at": "2025-06-03T10:08:32.478634+00:00"} {"global_step": 237676, "acc_step": 0, "speed/wps": 5533.798088942559, "speed/FLOPS": 244565550984959.6, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04846324771642685, "optim/lr": 4.700073250198278e-06, "optim/total_tokens": 1993770795008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2750177383422852, "created_at": "2025-06-03T10:08:35.443726+00:00"} {"global_step": 237677, "acc_step": 0, "speed/wps": 5528.310493690112, "speed/FLOPS": 244323027362860.16, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 195.5, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0472496896982193, "optim/lr": 4.696526025103732e-06, "optim/total_tokens": 1993779183616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2390954494476318, "created_at": "2025-06-03T10:08:38.415495+00:00"} {"global_step": 237678, "acc_step": 0, "speed/wps": 5516.925822467529, "speed/FLOPS": 243819883166851.78, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04786469414830208, "optim/lr": 4.692978800009184e-06, "optim/total_tokens": 1993787572224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2569972276687622, "created_at": "2025-06-03T10:08:41.389933+00:00"} {"global_step": 237679, "acc_step": 0, "speed/wps": 5517.752148724151, "speed/FLOPS": 243856402557873.3, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047045692801475525, "optim/lr": 4.689431574914638e-06, "optim/total_tokens": 1993795960832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2477667331695557, "created_at": "2025-06-03T10:08:44.365810+00:00"} {"global_step": 237680, "acc_step": 0, "speed/wps": 5517.885334405435, "speed/FLOPS": 243862288683279.94, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04742131382226944, "optim/lr": 4.685884349820313e-06, "optim/total_tokens": 1993804349440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2685823440551758, "created_at": "2025-06-03T10:08:47.342951+00:00"} {"global_step": 237681, "acc_step": 0, "speed/wps": 5523.425033920188, "speed/FLOPS": 244107115047079.5, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04698897525668144, "optim/lr": 4.682337124725766e-06, "optim/total_tokens": 1993812738048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2617958784103394, "created_at": "2025-06-03T10:08:50.316309+00:00"} {"global_step": 237682, "acc_step": 0, "speed/wps": 5511.0017825429, "speed/FLOPS": 243558070924168.3, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04799070581793785, "optim/lr": 4.67878989963122e-06, "optim/total_tokens": 1993821126656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2736365795135498, "created_at": "2025-06-03T10:08:53.295844+00:00"} {"global_step": 237683, "acc_step": 0, "speed/wps": 5513.322323682512, "speed/FLOPS": 243660626964932.88, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04825755953788757, "optim/lr": 4.675242674536673e-06, "optim/total_tokens": 1993829515264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2627712488174438, "created_at": "2025-06-03T10:08:56.272812+00:00"} {"global_step": 237684, "acc_step": 0, "speed/wps": 5510.037222538307, "speed/FLOPS": 243515442309030.94, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047993335872888565, "optim/lr": 4.671695449442348e-06, "optim/total_tokens": 1993837903872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2527931928634644, "created_at": "2025-06-03T10:08:59.250784+00:00"} {"global_step": 237685, "acc_step": 0, "speed/wps": 5513.131387347059, "speed/FLOPS": 243652188556206.6, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.09 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.09, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04740096256136894, "optim/lr": 4.668148224347801e-06, "optim/total_tokens": 1993846292480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2710360288619995, "created_at": "2025-06-03T10:09:02.227477+00:00"} {"global_step": 237686, "acc_step": 0, "speed/wps": 5519.595816853137, "speed/FLOPS": 243937883252425.53, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.0485810786485672, "optim/lr": 4.6646009992532545e-06, "optim/total_tokens": 1993854681088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2506160736083984, "created_at": "2025-06-03T10:09:05.202455+00:00"} {"global_step": 237687, "acc_step": 0, "speed/wps": 5527.042169514082, "speed/FLOPS": 244266973926151.28, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 195.56, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04959864541888237, "optim/lr": 4.66105377415893e-06, "optim/total_tokens": 1993863069696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.272102952003479, "created_at": "2025-06-03T10:09:08.172395+00:00"} {"global_step": 237688, "acc_step": 0, "speed/wps": 5513.495842799776, "speed/FLOPS": 243668295621764.6, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.047603026032447815, "optim/lr": 4.657506549064383e-06, "optim/total_tokens": 1993871458304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2657976150512695, "created_at": "2025-06-03T10:09:11.148388+00:00"} {"global_step": 237689, "acc_step": 0, "speed/wps": 5515.321226232209, "speed/FLOPS": 243748968226318.72, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.049556914716959, "optim/lr": 4.653959323969836e-06, "optim/total_tokens": 1993879846912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2547484636306763, "created_at": "2025-06-03T10:09:14.126128+00:00"} {"global_step": 237690, "acc_step": 0, "speed/wps": 5515.780133906582, "speed/FLOPS": 243769249596623.6, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04918504133820534, "optim/lr": 4.65041209887529e-06, "optim/total_tokens": 1993888235520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2757439613342285, "created_at": "2025-06-03T10:09:17.104096+00:00"} {"global_step": 237691, "acc_step": 0, "speed/wps": 5505.508794671641, "speed/FLOPS": 243315308975919.34, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.05, "optim/grad_norm": 0.04717942699790001, "optim/lr": 4.646864873780965e-06, "optim/total_tokens": 1993896624128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2635926008224487, "created_at": "2025-06-03T10:09:20.088685+00:00"} {"global_step": 237692, "acc_step": 0, "speed/wps": 5516.780078999897, "speed/FLOPS": 243813442051565.2, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04605390876531601, "optim/lr": 4.643317648686418e-06, "optim/total_tokens": 1993905012736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2486968040466309, "created_at": "2025-06-03T10:09:23.064171+00:00"} {"global_step": 237693, "acc_step": 0, "speed/wps": 5537.684952934325, "speed/FLOPS": 244737330478622.25, "speed/curr_iter_time": 2.9564, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9564, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.2, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04741779342293739, "optim/lr": 4.639770423591871e-06, "optim/total_tokens": 1993913401344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2483779191970825, "created_at": "2025-06-03T10:09:26.030269+00:00"} {"global_step": 237694, "acc_step": 0, "speed/wps": 5516.230352371141, "speed/FLOPS": 243789146948330.1, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04704586789011955, "optim/lr": 4.636223198497325e-06, "optim/total_tokens": 1993921789952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2771292924880981, "created_at": "2025-06-03T10:09:29.004803+00:00"} {"global_step": 237695, "acc_step": 0, "speed/wps": 5517.231389465275, "speed/FLOPS": 243833387664118.53, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04696139693260193, "optim/lr": 4.632675973403e-06, "optim/total_tokens": 1993930178560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2484632730484009, "created_at": "2025-06-03T10:09:31.978281+00:00"} {"global_step": 237696, "acc_step": 0, "speed/wps": 5508.46906825068, "speed/FLOPS": 243446137916059.1, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.08 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.08, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047882866114377975, "optim/lr": 4.629128748308453e-06, "optim/total_tokens": 1993938567168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2747973203659058, "created_at": "2025-06-03T10:09:34.956807+00:00"} {"global_step": 237697, "acc_step": 0, "speed/wps": 5517.7222401151885, "speed/FLOPS": 243855080750443.3, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04681406542658806, "optim/lr": 4.6255815232139065e-06, "optim/total_tokens": 1993946955776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2583324909210205, "created_at": "2025-06-03T10:09:37.930945+00:00"} {"global_step": 237698, "acc_step": 0, "speed/wps": 5513.751159774259, "speed/FLOPS": 243679579325205.97, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048365700989961624, "optim/lr": 4.622034298119359e-06, "optim/total_tokens": 1993955344384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2785134315490723, "created_at": "2025-06-03T10:09:40.906695+00:00"} {"global_step": 237699, "acc_step": 0, "speed/wps": 5518.035858786647, "speed/FLOPS": 243868941090475.88, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04638984426856041, "optim/lr": 4.618487073025035e-06, "optim/total_tokens": 1993963732992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.255133032798767, "created_at": "2025-06-03T10:09:43.879875+00:00"} {"global_step": 237700, "acc_step": 0, "speed/wps": 5522.177107566694, "speed/FLOPS": 244051963089721.16, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04710962623357773, "optim/lr": 4.6149398479304884e-06, "optim/total_tokens": 1993972121600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2479255199432373, "created_at": "2025-06-03T10:09:46.854040+00:00"} {"global_step": 237701, "acc_step": 0, "speed/wps": 5524.756752469434, "speed/FLOPS": 244165970190602.72, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046687740832567215, "optim/lr": 4.611392622835941e-06, "optim/total_tokens": 1993980510208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2753479480743408, "created_at": "2025-06-03T10:09:49.823865+00:00"} {"global_step": 237702, "acc_step": 0, "speed/wps": 5518.727111190512, "speed/FLOPS": 243899490908576.2, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04706812649965286, "optim/lr": 4.607845397741395e-06, "optim/total_tokens": 1993988898816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2635284662246704, "created_at": "2025-06-03T10:09:52.796655+00:00"} {"global_step": 237703, "acc_step": 0, "speed/wps": 5531.621918078324, "speed/FLOPS": 244469375371412.62, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047462042421102524, "optim/lr": 4.60429817264707e-06, "optim/total_tokens": 1993997287424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2561396360397339, "created_at": "2025-06-03T10:09:55.762638+00:00"} {"global_step": 237704, "acc_step": 0, "speed/wps": 5525.44444444379, "speed/FLOPS": 244196362655942.66, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.050412677228450775, "optim/lr": 4.600750947552523e-06, "optim/total_tokens": 1994005676032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2555360794067383, "created_at": "2025-06-03T10:09:58.731752+00:00"} {"global_step": 237705, "acc_step": 0, "speed/wps": 5515.441654232771, "speed/FLOPS": 243754290527537.2, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04781675711274147, "optim/lr": 4.597203722457977e-06, "optim/total_tokens": 1994014064640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2562490701675415, "created_at": "2025-06-03T10:10:01.706300+00:00"} {"global_step": 237706, "acc_step": 0, "speed/wps": 5521.348192691778, "speed/FLOPS": 244015329295020.84, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0474245585501194, "optim/lr": 4.5936564973634295e-06, "optim/total_tokens": 1994022453248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2674121856689453, "created_at": "2025-06-03T10:10:04.678673+00:00"} {"global_step": 237707, "acc_step": 0, "speed/wps": 5517.867466562636, "speed/FLOPS": 243861499016084.12, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04854816198348999, "optim/lr": 4.590109272269105e-06, "optim/total_tokens": 1994030841856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2535656690597534, "created_at": "2025-06-03T10:10:07.653030+00:00"} {"global_step": 237708, "acc_step": 0, "speed/wps": 5514.006884074835, "speed/FLOPS": 243690881030375.84, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04776357486844063, "optim/lr": 4.586562047174559e-06, "optim/total_tokens": 1994039230464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2562839984893799, "created_at": "2025-06-03T10:10:10.628350+00:00"} {"global_step": 237709, "acc_step": 0, "speed/wps": 5513.161913983995, "speed/FLOPS": 243653537677309.7, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.07 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.07, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04849260300397873, "optim/lr": 4.583014822080011e-06, "optim/total_tokens": 1994047619072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2735481262207031, "created_at": "2025-06-03T10:10:13.610756+00:00"} {"global_step": 237710, "acc_step": 0, "speed/wps": 5525.1646395409925, "speed/FLOPS": 244183996711410.3, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.05274904519319534, "optim/lr": 4.579467596985465e-06, "optim/total_tokens": 1994056007680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2569888830184937, "created_at": "2025-06-03T10:10:16.581295+00:00"} {"global_step": 237711, "acc_step": 0, "speed/wps": 5524.298082520712, "speed/FLOPS": 244145699326554.84, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048818618059158325, "optim/lr": 4.5759203718911405e-06, "optim/total_tokens": 1994064396288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2571083307266235, "created_at": "2025-06-03T10:10:19.551523+00:00"} {"global_step": 237712, "acc_step": 0, "speed/wps": 5514.519240920922, "speed/FLOPS": 243713524580492.8, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04785596579313278, "optim/lr": 4.572373146796593e-06, "optim/total_tokens": 1994072784896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2774968147277832, "created_at": "2025-06-03T10:10:22.527026+00:00"} {"global_step": 237713, "acc_step": 0, "speed/wps": 5520.347504408253, "speed/FLOPS": 243971103994876.0, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04764139652252197, "optim/lr": 4.568825921702047e-06, "optim/total_tokens": 1994081173504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2575974464416504, "created_at": "2025-06-03T10:10:25.500278+00:00"} {"global_step": 237714, "acc_step": 0, "speed/wps": 5516.162046115265, "speed/FLOPS": 243786128161443.5, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04785403981804848, "optim/lr": 4.565278696607722e-06, "optim/total_tokens": 1994089562112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.260518193244934, "created_at": "2025-06-03T10:10:28.478708+00:00"} {"global_step": 237715, "acc_step": 0, "speed/wps": 5530.922864573046, "speed/FLOPS": 244438480784559.56, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 195.54, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04870785027742386, "optim/lr": 4.561731471513175e-06, "optim/total_tokens": 1994097950720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2683186531066895, "created_at": "2025-06-03T10:10:31.446694+00:00"} {"global_step": 237716, "acc_step": 0, "speed/wps": 5509.906690796382, "speed/FLOPS": 243509673474159.88, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047274149954319, "optim/lr": 4.558184246418629e-06, "optim/total_tokens": 1994106339328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2782939672470093, "created_at": "2025-06-03T10:10:34.424030+00:00"} {"global_step": 237717, "acc_step": 0, "speed/wps": 5513.5596541666155, "speed/FLOPS": 243671115757562.7, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04736415669322014, "optim/lr": 4.5546370213240815e-06, "optim/total_tokens": 1994114727936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2609431743621826, "created_at": "2025-06-03T10:10:37.400887+00:00"} {"global_step": 237718, "acc_step": 0, "speed/wps": 5517.7086617621935, "speed/FLOPS": 243854480656741.25, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.06 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.06, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04708585888147354, "optim/lr": 4.551089796229757e-06, "optim/total_tokens": 1994123116544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.241974115371704, "created_at": "2025-06-03T10:10:40.374722+00:00"} {"global_step": 237719, "acc_step": 0, "speed/wps": 5531.841732337915, "speed/FLOPS": 244479090036575.2, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04870779812335968, "optim/lr": 4.547542571135211e-06, "optim/total_tokens": 1994131505152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2476989030838013, "created_at": "2025-06-03T10:10:43.342148+00:00"} {"global_step": 237720, "acc_step": 0, "speed/wps": 5527.752483621075, "speed/FLOPS": 244298366173963.2, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0477534681558609, "optim/lr": 4.543995346040663e-06, "optim/total_tokens": 1994139893760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2609360218048096, "created_at": "2025-06-03T10:10:46.315083+00:00"} {"global_step": 237721, "acc_step": 0, "speed/wps": 5522.989932604546, "speed/FLOPS": 244087885795978.53, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04833828657865524, "optim/lr": 4.540448120946117e-06, "optim/total_tokens": 1994148282368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.261521816253662, "created_at": "2025-06-03T10:10:49.286272+00:00"} {"global_step": 237722, "acc_step": 0, "speed/wps": 5521.623014660739, "speed/FLOPS": 244027475019382.53, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04674811661243439, "optim/lr": 4.5369008958517925e-06, "optim/total_tokens": 1994156670976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2536931037902832, "created_at": "2025-06-03T10:10:52.261166+00:00"} {"global_step": 237723, "acc_step": 0, "speed/wps": 5517.667948736409, "speed/FLOPS": 243852681349389.72, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.053055934607982635, "optim/lr": 4.533353670757245e-06, "optim/total_tokens": 1994165059584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2588529586791992, "created_at": "2025-06-03T10:10:55.237792+00:00"} {"global_step": 237724, "acc_step": 0, "speed/wps": 5521.03516511168, "speed/FLOPS": 244001495078200.88, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047205161303281784, "optim/lr": 4.529806445662699e-06, "optim/total_tokens": 1994173448192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.246687650680542, "created_at": "2025-06-03T10:10:58.212897+00:00"} {"global_step": 237725, "acc_step": 0, "speed/wps": 5511.137911208704, "speed/FLOPS": 243564087114427.2, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047161463648080826, "optim/lr": 4.526259220568152e-06, "optim/total_tokens": 1994181836800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2481238842010498, "created_at": "2025-06-03T10:11:01.193433+00:00"} {"global_step": 237726, "acc_step": 0, "speed/wps": 5525.4801500298645, "speed/FLOPS": 244197940660089.38, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04669417440891266, "optim/lr": 4.522711995473827e-06, "optim/total_tokens": 1994190225408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2625747919082642, "created_at": "2025-06-03T10:11:04.164848+00:00"} {"global_step": 237727, "acc_step": 0, "speed/wps": 5514.126358530239, "speed/FLOPS": 243696161189778.97, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04795920103788376, "optim/lr": 4.519164770379281e-06, "optim/total_tokens": 1994198614016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2652859687805176, "created_at": "2025-06-03T10:11:07.141705+00:00"} {"global_step": 237728, "acc_step": 0, "speed/wps": 5521.747735868648, "speed/FLOPS": 244032987058391.12, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04624016955494881, "optim/lr": 4.5156175452847335e-06, "optim/total_tokens": 1994207002624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2527955770492554, "created_at": "2025-06-03T10:11:10.113126+00:00"} {"global_step": 237729, "acc_step": 0, "speed/wps": 5523.820594535499, "speed/FLOPS": 244124596801613.47, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04656943306326866, "optim/lr": 4.512070320190187e-06, "optim/total_tokens": 1994215391232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.248807668685913, "created_at": "2025-06-03T10:11:13.083689+00:00"} {"global_step": 237730, "acc_step": 0, "speed/wps": 5514.5203247558175, "speed/FLOPS": 243713572480447.6, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04942871630191803, "optim/lr": 4.508523095095862e-06, "optim/total_tokens": 1994223779840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2631494998931885, "created_at": "2025-06-03T10:11:16.060435+00:00"} {"global_step": 237731, "acc_step": 0, "speed/wps": 5519.892556074989, "speed/FLOPS": 243950997607182.4, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0470353402197361, "optim/lr": 4.5049758700013154e-06, "optim/total_tokens": 1994232168448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2709614038467407, "created_at": "2025-06-03T10:11:19.036912+00:00"} {"global_step": 237732, "acc_step": 0, "speed/wps": 5509.6403967474425, "speed/FLOPS": 243497904640213.25, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.05 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.05, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04702018201351166, "optim/lr": 4.501428644906769e-06, "optim/total_tokens": 1994240557056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2628495693206787, "created_at": "2025-06-03T10:11:22.015239+00:00"} {"global_step": 237733, "acc_step": 0, "speed/wps": 5524.695789459696, "speed/FLOPS": 244163275937609.28, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046751588582992554, "optim/lr": 4.497881419812222e-06, "optim/total_tokens": 1994248945664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2404447793960571, "created_at": "2025-06-03T10:11:24.985309+00:00"} {"global_step": 237734, "acc_step": 0, "speed/wps": 5527.202572203303, "speed/FLOPS": 244274062903999.47, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04731952026486397, "optim/lr": 4.494334194717897e-06, "optim/total_tokens": 1994257334272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2606682777404785, "created_at": "2025-06-03T10:11:27.958742+00:00"} {"global_step": 237735, "acc_step": 0, "speed/wps": 5519.344458395557, "speed/FLOPS": 243926774495169.72, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.05032414197921753, "optim/lr": 4.490786969623351e-06, "optim/total_tokens": 1994265722880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2656458616256714, "created_at": "2025-06-03T10:11:30.935269+00:00"} {"global_step": 237736, "acc_step": 0, "speed/wps": 5538.065007005886, "speed/FLOPS": 244754126923292.16, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04744267836213112, "optim/lr": 4.487239744528804e-06, "optim/total_tokens": 1994274111488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2732293605804443, "created_at": "2025-06-03T10:11:33.901096+00:00"} {"global_step": 237737, "acc_step": 0, "speed/wps": 5517.6708751462675, "speed/FLOPS": 243852810681726.75, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047148171812295914, "optim/lr": 4.483692519434257e-06, "optim/total_tokens": 1994282500096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2650233507156372, "created_at": "2025-06-03T10:11:36.879430+00:00"} {"global_step": 237738, "acc_step": 0, "speed/wps": 5524.7158720397765, "speed/FLOPS": 244164163484856.84, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04729075729846954, "optim/lr": 4.480145294339932e-06, "optim/total_tokens": 1994290888704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.27212393283844, "created_at": "2025-06-03T10:11:39.853641+00:00"} {"global_step": 237739, "acc_step": 0, "speed/wps": 5520.578356734112, "speed/FLOPS": 243981306486069.62, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047363441437482834, "optim/lr": 4.476598069245386e-06, "optim/total_tokens": 1994299277312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2780810594558716, "created_at": "2025-06-03T10:11:42.829012+00:00"} {"global_step": 237740, "acc_step": 0, "speed/wps": 5522.595913420202, "speed/FLOPS": 244070472164803.53, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04664120450615883, "optim/lr": 4.473050844150839e-06, "optim/total_tokens": 1994307665920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.260358452796936, "created_at": "2025-06-03T10:11:45.800407+00:00"} {"global_step": 237741, "acc_step": 0, "speed/wps": 5507.983382172208, "speed/FLOPS": 243424673077357.34, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 196.37, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04689878970384598, "optim/lr": 4.469503619056292e-06, "optim/total_tokens": 1994316054528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2532883882522583, "created_at": "2025-06-03T10:11:48.778910+00:00"} {"global_step": 237742, "acc_step": 0, "speed/wps": 5514.328439464102, "speed/FLOPS": 243705092132711.75, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.04 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.04, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04998156800866127, "optim/lr": 4.4659563939619675e-06, "optim/total_tokens": 1994324443136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2457983493804932, "created_at": "2025-06-03T10:11:51.754167+00:00"} {"global_step": 237743, "acc_step": 0, "speed/wps": 5528.8289674557345, "speed/FLOPS": 244345941249511.38, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04774004593491554, "optim/lr": 4.46240916886742e-06, "optim/total_tokens": 1994332831744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2581509351730347, "created_at": "2025-06-03T10:11:54.724280+00:00"} {"global_step": 237744, "acc_step": 0, "speed/wps": 5537.400478110365, "speed/FLOPS": 244724758147477.34, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.25, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04734645038843155, "optim/lr": 4.458861943772874e-06, "optim/total_tokens": 1994341220352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2745023965835571, "created_at": "2025-06-03T10:11:57.688162+00:00"} {"global_step": 237745, "acc_step": 0, "speed/wps": 5525.1720795824585, "speed/FLOPS": 244184325523161.53, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047677747905254364, "optim/lr": 4.455314718678549e-06, "optim/total_tokens": 1994349608960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.255592703819275, "created_at": "2025-06-03T10:12:00.657568+00:00"} {"global_step": 237746, "acc_step": 0, "speed/wps": 5518.505339218458, "speed/FLOPS": 243889689722543.25, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04820461943745613, "optim/lr": 4.451767493584002e-06, "optim/total_tokens": 1994357997568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.252550482749939, "created_at": "2025-06-03T10:12:03.634740+00:00"} {"global_step": 237747, "acc_step": 0, "speed/wps": 5515.580105985528, "speed/FLOPS": 243760409386348.72, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04707604646682739, "optim/lr": 4.448220268489456e-06, "optim/total_tokens": 1994366386176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2723002433776855, "created_at": "2025-06-03T10:12:06.612086+00:00"} {"global_step": 237748, "acc_step": 0, "speed/wps": 5513.5468980822625, "speed/FLOPS": 243670552003925.84, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04762177914381027, "optim/lr": 4.444673043394909e-06, "optim/total_tokens": 1994374774784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.267643690109253, "created_at": "2025-06-03T10:12:09.588046+00:00"} {"global_step": 237749, "acc_step": 0, "speed/wps": 5512.47035611671, "speed/FLOPS": 243622974359289.72, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048279665410518646, "optim/lr": 4.441125818300584e-06, "optim/total_tokens": 1994383163392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2491421699523926, "created_at": "2025-06-03T10:12:12.566834+00:00"} {"global_step": 237750, "acc_step": 0, "speed/wps": 5519.47927040966, "speed/FLOPS": 243932732496162.62, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04698167368769646, "optim/lr": 4.437578593206038e-06, "optim/total_tokens": 1994391552000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2640422582626343, "created_at": "2025-06-03T10:12:15.543422+00:00"} {"global_step": 237751, "acc_step": 0, "speed/wps": 5505.043470350113, "speed/FLOPS": 243294744022653.6, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04725256562232971, "optim/lr": 4.43403136811149e-06, "optim/total_tokens": 1994399940608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2644269466400146, "created_at": "2025-06-03T10:12:18.523659+00:00"} {"global_step": 237752, "acc_step": 0, "speed/wps": 5526.335784262491, "speed/FLOPS": 244235755313638.44, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04695306345820427, "optim/lr": 4.430484143016944e-06, "optim/total_tokens": 1994408329216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2577115297317505, "created_at": "2025-06-03T10:12:21.492839+00:00"} {"global_step": 237753, "acc_step": 0, "speed/wps": 5530.307875092681, "speed/FLOPS": 244411301397328.9, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.050104767084121704, "optim/lr": 4.4269369179226195e-06, "optim/total_tokens": 1994416717824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2565674781799316, "created_at": "2025-06-03T10:12:24.464161+00:00"} {"global_step": 237754, "acc_step": 0, "speed/wps": 5523.693109188377, "speed/FLOPS": 244118962601799.84, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046479444950819016, "optim/lr": 4.423389692828072e-06, "optim/total_tokens": 1994425106432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2539021968841553, "created_at": "2025-06-03T10:12:27.435087+00:00"} {"global_step": 237755, "acc_step": 0, "speed/wps": 5522.046649578774, "speed/FLOPS": 244046197514399.62, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04871530458331108, "optim/lr": 4.419842467733526e-06, "optim/total_tokens": 1994433495040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2582050561904907, "created_at": "2025-06-03T10:12:30.406381+00:00"} {"global_step": 237756, "acc_step": 0, "speed/wps": 5529.153914844696, "speed/FLOPS": 244360302260872.0, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047597602009773254, "optim/lr": 4.4162952426389795e-06, "optim/total_tokens": 1994441883648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2626547813415527, "created_at": "2025-06-03T10:12:33.373411+00:00"} {"global_step": 237757, "acc_step": 0, "speed/wps": 5503.834132992693, "speed/FLOPS": 243241297501405.34, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04763200506567955, "optim/lr": 4.412748017544654e-06, "optim/total_tokens": 1994450272256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2399308681488037, "created_at": "2025-06-03T10:12:36.356374+00:00"} {"global_step": 237758, "acc_step": 0, "speed/wps": 5510.449067746666, "speed/FLOPS": 243533643759225.53, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.03 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.03, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04656698554754257, "optim/lr": 4.409200792450108e-06, "optim/total_tokens": 1994458660864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2610687017440796, "created_at": "2025-06-03T10:12:39.337099+00:00"} {"global_step": 237759, "acc_step": 0, "speed/wps": 5515.563218427422, "speed/FLOPS": 243759663042718.8, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046779338270425797, "optim/lr": 4.4056535673555605e-06, "optim/total_tokens": 1994467049472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2680195569992065, "created_at": "2025-06-03T10:12:42.312275+00:00"} {"global_step": 237760, "acc_step": 0, "speed/wps": 5523.152797007688, "speed/FLOPS": 244095083568981.8, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046522289514541626, "optim/lr": 4.402106342261014e-06, "optim/total_tokens": 1994475438080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2446227073669434, "created_at": "2025-06-03T10:12:45.282999+00:00"} {"global_step": 237761, "acc_step": 0, "speed/wps": 5526.338628298756, "speed/FLOPS": 244235881005484.25, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04642563313245773, "optim/lr": 4.39855911716669e-06, "optim/total_tokens": 1994483826688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2507363557815552, "created_at": "2025-06-03T10:12:48.253135+00:00"} {"global_step": 237762, "acc_step": 0, "speed/wps": 5514.0209432588945, "speed/FLOPS": 243691502374349.8, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0465814583003521, "optim/lr": 4.3950118920721424e-06, "optim/total_tokens": 1994492215296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.272587537765503, "created_at": "2025-06-03T10:12:51.228864+00:00"} {"global_step": 237763, "acc_step": 0, "speed/wps": 5515.489264219876, "speed/FLOPS": 243756394645277.22, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04675126448273659, "optim/lr": 4.391464666977596e-06, "optim/total_tokens": 1994500603904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2821837663650513, "created_at": "2025-06-03T10:12:54.203830+00:00"} {"global_step": 237764, "acc_step": 0, "speed/wps": 5515.812877160121, "speed/FLOPS": 243770696680834.88, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04728923365473747, "optim/lr": 4.387917441883049e-06, "optim/total_tokens": 1994508992512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.273773431777954, "created_at": "2025-06-03T10:12:57.180892+00:00"} {"global_step": 237765, "acc_step": 0, "speed/wps": 5509.525714560456, "speed/FLOPS": 243492836274545.12, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04747714474797249, "optim/lr": 4.384370216788724e-06, "optim/total_tokens": 1994517381120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2705079317092896, "created_at": "2025-06-03T10:13:00.161435+00:00"} {"global_step": 237766, "acc_step": 0, "speed/wps": 5512.011383307959, "speed/FLOPS": 243602690110378.72, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0463845394551754, "optim/lr": 4.380822991694178e-06, "optim/total_tokens": 1994525769728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2666664123535156, "created_at": "2025-06-03T10:13:03.138552+00:00"} {"global_step": 237767, "acc_step": 0, "speed/wps": 5506.597929646608, "speed/FLOPS": 243363443167114.7, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.02 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.02, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047193460166454315, "optim/lr": 4.377275766599631e-06, "optim/total_tokens": 1994534158336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.25770103931427, "created_at": "2025-06-03T10:13:06.121525+00:00"} {"global_step": 237768, "acc_step": 0, "speed/wps": 5523.228765071066, "speed/FLOPS": 244098440968543.34, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046896692365407944, "optim/lr": 4.373728541505084e-06, "optim/total_tokens": 1994542546944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.25885808467865, "created_at": "2025-06-03T10:13:09.092547+00:00"} {"global_step": 237769, "acc_step": 0, "speed/wps": 5531.304477112523, "speed/FLOPS": 244455346105534.38, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04708748310804367, "optim/lr": 4.37018131641076e-06, "optim/total_tokens": 1994550935552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2430487871170044, "created_at": "2025-06-03T10:13:12.060471+00:00"} {"global_step": 237770, "acc_step": 0, "speed/wps": 5518.739686535502, "speed/FLOPS": 243900046674458.28, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048922572284936905, "optim/lr": 4.366634091316213e-06, "optim/total_tokens": 1994559324160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2535548210144043, "created_at": "2025-06-03T10:13:15.033852+00:00"} {"global_step": 237771, "acc_step": 0, "speed/wps": 5518.0697642516425, "speed/FLOPS": 243870439538484.78, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04790721833705902, "optim/lr": 4.363086866221666e-06, "optim/total_tokens": 1994567712768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2577052116394043, "created_at": "2025-06-03T10:13:18.007319+00:00"} {"global_step": 237772, "acc_step": 0, "speed/wps": 5521.518685530341, "speed/FLOPS": 244022864205823.84, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048184990882873535, "optim/lr": 4.359539641127342e-06, "optim/total_tokens": 1994576101376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2610687017440796, "created_at": "2025-06-03T10:13:20.978742+00:00"} {"global_step": 237773, "acc_step": 0, "speed/wps": 5519.5032958944, "speed/FLOPS": 243933794299614.56, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04771951958537102, "optim/lr": 4.3559924160327945e-06, "optim/total_tokens": 1994584489984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.275613784790039, "created_at": "2025-06-03T10:13:23.951612+00:00"} {"global_step": 237774, "acc_step": 0, "speed/wps": 5521.53118998332, "speed/FLOPS": 244023416838641.9, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.05430331453680992, "optim/lr": 4.352445190938248e-06, "optim/total_tokens": 1994592878592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.264157772064209, "created_at": "2025-06-03T10:13:26.923047+00:00"} {"global_step": 237775, "acc_step": 0, "speed/wps": 5518.318852403382, "speed/FLOPS": 243881447959842.94, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04627154394984245, "optim/lr": 4.348897965843701e-06, "optim/total_tokens": 1994601267200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2615163326263428, "created_at": "2025-06-03T10:13:29.896551+00:00"} {"global_step": 237776, "acc_step": 0, "speed/wps": 5527.78040285677, "speed/FLOPS": 244299600061277.3, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047343604266643524, "optim/lr": 4.345350740749376e-06, "optim/total_tokens": 1994609655808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.27047860622406, "created_at": "2025-06-03T10:13:32.864678+00:00"} {"global_step": 237777, "acc_step": 0, "speed/wps": 5532.369038415117, "speed/FLOPS": 244502394266190.3, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.45, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04741889238357544, "optim/lr": 4.34180351565483e-06, "optim/total_tokens": 1994618044416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.255143165588379, "created_at": "2025-06-03T10:13:35.830463+00:00"} {"global_step": 237778, "acc_step": 0, "speed/wps": 5519.904320535388, "speed/FLOPS": 243951517536116.06, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046997688710689545, "optim/lr": 4.338256290560283e-06, "optim/total_tokens": 1994626433024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2449498176574707, "created_at": "2025-06-03T10:13:38.808156+00:00"} {"global_step": 237779, "acc_step": 0, "speed/wps": 5515.079841386432, "speed/FLOPS": 243738300251655.03, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047615110874176025, "optim/lr": 4.334709065465736e-06, "optim/total_tokens": 1994634821632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2573271989822388, "created_at": "2025-06-03T10:13:41.785041+00:00"} {"global_step": 237780, "acc_step": 0, "speed/wps": 5512.660775076217, "speed/FLOPS": 243631389902647.34, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047208793461322784, "optim/lr": 4.331161840371412e-06, "optim/total_tokens": 1994643210240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2582957744598389, "created_at": "2025-06-03T10:13:44.763218+00:00"} {"global_step": 237781, "acc_step": 0, "speed/wps": 5512.0809330622715, "speed/FLOPS": 243605763853531.44, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.01 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.01, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.05025532469153404, "optim/lr": 4.327614615276865e-06, "optim/total_tokens": 1994651598848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2584424018859863, "created_at": "2025-06-03T10:13:47.744369+00:00"} {"global_step": 237782, "acc_step": 0, "speed/wps": 5514.562693613202, "speed/FLOPS": 243715444967080.53, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04789792746305466, "optim/lr": 4.324067390182318e-06, "optim/total_tokens": 1994659987456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2544649839401245, "created_at": "2025-06-03T10:13:50.719494+00:00"} {"global_step": 237783, "acc_step": 0, "speed/wps": 5520.509264103093, "speed/FLOPS": 243978252945426.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04742293804883957, "optim/lr": 4.320520165087771e-06, "optim/total_tokens": 1994668376064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2696363925933838, "created_at": "2025-06-03T10:13:53.691567+00:00"} {"global_step": 237784, "acc_step": 0, "speed/wps": 5516.319394546776, "speed/FLOPS": 243793082156734.0, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046567097306251526, "optim/lr": 4.3169729399934465e-06, "optim/total_tokens": 1994676764672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2634488344192505, "created_at": "2025-06-03T10:13:56.665577+00:00"} {"global_step": 237785, "acc_step": 0, "speed/wps": 5513.094214537155, "speed/FLOPS": 243650545708276.53, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04756264016032219, "optim/lr": 4.3134257148989e-06, "optim/total_tokens": 1994685153280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2614820003509521, "created_at": "2025-06-03T10:13:59.642567+00:00"} {"global_step": 237786, "acc_step": 0, "speed/wps": 5528.257532930389, "speed/FLOPS": 244320686768358.16, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04742656275629997, "optim/lr": 4.309878489804353e-06, "optim/total_tokens": 1994693541888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2541064023971558, "created_at": "2025-06-03T10:14:02.613447+00:00"} {"global_step": 237787, "acc_step": 0, "speed/wps": 5530.4862361189, "speed/FLOPS": 244419184041753.3, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0486108735203743, "optim/lr": 4.3063312647098065e-06, "optim/total_tokens": 1994701930496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2659912109375, "created_at": "2025-06-03T10:14:05.580303+00:00"} {"global_step": 237788, "acc_step": 0, "speed/wps": 5524.545864817441, "speed/FLOPS": 244156650035805.47, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04860691353678703, "optim/lr": 4.302784039615481e-06, "optim/total_tokens": 1994710319104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2568689584732056, "created_at": "2025-06-03T10:14:08.555752+00:00"} {"global_step": 237789, "acc_step": 0, "speed/wps": 5516.889334192254, "speed/FLOPS": 243818270571848.56, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047452282160520554, "optim/lr": 4.299236814520935e-06, "optim/total_tokens": 1994718707712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2715080976486206, "created_at": "2025-06-03T10:14:11.530412+00:00"} {"global_step": 237790, "acc_step": 0, "speed/wps": 5526.918707521558, "speed/FLOPS": 244261517538017.47, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04690907895565033, "optim/lr": 4.295689589426388e-06, "optim/total_tokens": 1994727096320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2440671920776367, "created_at": "2025-06-03T10:14:14.498879+00:00"} {"global_step": 237791, "acc_step": 0, "speed/wps": 5505.914567795142, "speed/FLOPS": 243333242071042.94, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.39, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04685730114579201, "optim/lr": 4.292142364331841e-06, "optim/total_tokens": 1994735484928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2670282125473022, "created_at": "2025-06-03T10:14:17.478874+00:00"} {"global_step": 237792, "acc_step": 0, "speed/wps": 5516.576769160298, "speed/FLOPS": 243804456797288.97, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047627877444028854, "optim/lr": 4.288595139237517e-06, "optim/total_tokens": 1994743873536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2537906169891357, "created_at": "2025-06-03T10:14:20.453118+00:00"} {"global_step": 237793, "acc_step": 0, "speed/wps": 5507.3369577770145, "speed/FLOPS": 243396104427789.78, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04730032756924629, "optim/lr": 4.28504791414297e-06, "optim/total_tokens": 1994752262144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2674272060394287, "created_at": "2025-06-03T10:14:23.432230+00:00"} {"global_step": 237794, "acc_step": 0, "speed/wps": 5515.837398213084, "speed/FLOPS": 243771780385865.72, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04734712839126587, "optim/lr": 4.281500689048423e-06, "optim/total_tokens": 1994760650752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2649142742156982, "created_at": "2025-06-03T10:14:26.412186+00:00"} {"global_step": 237795, "acc_step": 0, "speed/wps": 5509.097895171221, "speed/FLOPS": 243473928847319.06, "speed/curr_iter_time": 2.973, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.973, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046389345079660416, "optim/lr": 4.277953463953877e-06, "optim/total_tokens": 1994769039360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2571340799331665, "created_at": "2025-06-03T10:14:29.390311+00:00"} {"global_step": 237796, "acc_step": 0, "speed/wps": 5518.527094086436, "speed/FLOPS": 243890651176356.34, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04666442796587944, "optim/lr": 4.274406238859551e-06, "optim/total_tokens": 1994777427968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2319812774658203, "created_at": "2025-06-03T10:14:32.365222+00:00"} {"global_step": 237797, "acc_step": 0, "speed/wps": 5527.672105796157, "speed/FLOPS": 244294813885512.8, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04773390293121338, "optim/lr": 4.270859013765005e-06, "optim/total_tokens": 1994785816576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2820502519607544, "created_at": "2025-06-03T10:14:35.338110+00:00"} {"global_step": 237798, "acc_step": 0, "speed/wps": 5478.641459112806, "speed/FLOPS": 242127910263708.66, "speed/curr_iter_time": 2.9881, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9881, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "1.0 hours", "speed/est_time_elapsed_hrs": 197.38, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 1.0, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048141442239284515, "optim/lr": 4.2673117886704585e-06, "optim/total_tokens": 1994794205184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2704415321350098, "created_at": "2025-06-03T10:14:38.337336+00:00"} {"global_step": 237799, "acc_step": 0, "speed/wps": 5505.250513166548, "speed/FLOPS": 243303894255398.8, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047374047338962555, "optim/lr": 4.263764563576133e-06, "optim/total_tokens": 1994802593792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2581292390823364, "created_at": "2025-06-03T10:14:41.323416+00:00"} {"global_step": 237800, "acc_step": 0, "speed/wps": 5506.596160329245, "speed/FLOPS": 243363364972343.47, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04999587684869766, "optim/lr": 4.260217338481587e-06, "optim/total_tokens": 1994810982400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.245476245880127, "created_at": "2025-06-03T10:14:44.305916+00:00"} {"global_step": 237801, "acc_step": 0, "speed/wps": 5515.22583133186, "speed/FLOPS": 243744752259998.66, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048019059002399445, "optim/lr": 4.2566701133870404e-06, "optim/total_tokens": 1994819371008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2466124296188354, "created_at": "2025-06-03T10:14:47.283582+00:00"} {"global_step": 237802, "acc_step": 0, "speed/wps": 5516.979891192661, "speed/FLOPS": 243822272727753.8, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047484107315540314, "optim/lr": 4.253122888292493e-06, "optim/total_tokens": 1994827759616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2534133195877075, "created_at": "2025-06-03T10:14:50.257601+00:00"} {"global_step": 237803, "acc_step": 0, "speed/wps": 5526.055743270057, "speed/FLOPS": 244223378935152.6, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0480361208319664, "optim/lr": 4.249575663198169e-06, "optim/total_tokens": 1994836148224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2697079181671143, "created_at": "2025-06-03T10:14:53.228546+00:00"} {"global_step": 237804, "acc_step": 0, "speed/wps": 5518.88698399402, "speed/FLOPS": 243906556468188.03, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046403203159570694, "optim/lr": 4.2460284381036215e-06, "optim/total_tokens": 1994844536832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2777340412139893, "created_at": "2025-06-03T10:14:56.205091+00:00"} {"global_step": 237805, "acc_step": 0, "speed/wps": 5514.465888940179, "speed/FLOPS": 243711166696024.16, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.99 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.99, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046774547547101974, "optim/lr": 4.242481213009075e-06, "optim/total_tokens": 1994852925440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2641249895095825, "created_at": "2025-06-03T10:14:59.186835+00:00"} {"global_step": 237806, "acc_step": 0, "speed/wps": 5518.5639892078, "speed/FLOPS": 243892281751874.28, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04697723314166069, "optim/lr": 4.238933987914529e-06, "optim/total_tokens": 1994861314048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2687400579452515, "created_at": "2025-06-03T10:15:02.163710+00:00"} {"global_step": 237807, "acc_step": 0, "speed/wps": 5516.314889029176, "speed/FLOPS": 243792883035917.4, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04696100205183029, "optim/lr": 4.235386762820203e-06, "optim/total_tokens": 1994869702656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2704663276672363, "created_at": "2025-06-03T10:15:05.142015+00:00"} {"global_step": 237808, "acc_step": 0, "speed/wps": 5487.387312795564, "speed/FLOPS": 242514432231149.3, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04661012068390846, "optim/lr": 4.231839537725657e-06, "optim/total_tokens": 1994878091264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2737404108047485, "created_at": "2025-06-03T10:15:08.135144+00:00"} {"global_step": 237809, "acc_step": 0, "speed/wps": 5526.227973880329, "speed/FLOPS": 244230990646570.44, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04699893668293953, "optim/lr": 4.22829231263111e-06, "optim/total_tokens": 1994886479872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.255876898765564, "created_at": "2025-06-03T10:15:11.104526+00:00"} {"global_step": 237810, "acc_step": 0, "speed/wps": 5521.903797285249, "speed/FLOPS": 244039884174210.16, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04752722010016441, "optim/lr": 4.224745087536563e-06, "optim/total_tokens": 1994894868480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2536417245864868, "created_at": "2025-06-03T10:15:14.076279+00:00"} {"global_step": 237811, "acc_step": 0, "speed/wps": 5528.369244134856, "speed/FLOPS": 244325623831805.8, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04636885225772858, "optim/lr": 4.221197862442239e-06, "optim/total_tokens": 1994903257088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2537403106689453, "created_at": "2025-06-03T10:15:17.047164+00:00"} {"global_step": 237812, "acc_step": 0, "speed/wps": 5520.221303939173, "speed/FLOPS": 243965526580095.2, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04721260815858841, "optim/lr": 4.217650637347692e-06, "optim/total_tokens": 1994911645696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2527626752853394, "created_at": "2025-06-03T10:15:20.020029+00:00"} {"global_step": 237813, "acc_step": 0, "speed/wps": 5512.600699719993, "speed/FLOPS": 243628734879395.78, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047352712601423264, "optim/lr": 4.214103412253145e-06, "optim/total_tokens": 1994920034304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.268630862236023, "created_at": "2025-06-03T10:15:22.996404+00:00"} {"global_step": 237814, "acc_step": 0, "speed/wps": 5518.587014340173, "speed/FLOPS": 243893299344871.88, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04703200235962868, "optim/lr": 4.210556187158599e-06, "optim/total_tokens": 1994928422912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2548965215682983, "created_at": "2025-06-03T10:15:25.975032+00:00"} {"global_step": 237815, "acc_step": 0, "speed/wps": 5525.520408310565, "speed/FLOPS": 244199719870035.75, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04744391888380051, "optim/lr": 4.2070089620642735e-06, "optim/total_tokens": 1994936811520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.27892005443573, "created_at": "2025-06-03T10:15:28.949307+00:00"} {"global_step": 237816, "acc_step": 0, "speed/wps": 5516.024120330388, "speed/FLOPS": 243780032547720.1, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047254081815481186, "optim/lr": 4.203461736969727e-06, "optim/total_tokens": 1994945200128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2617703676223755, "created_at": "2025-06-03T10:15:31.927523+00:00"} {"global_step": 237817, "acc_step": 0, "speed/wps": 5514.3711856453865, "speed/FLOPS": 243706981295129.72, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04758622497320175, "optim/lr": 4.19991451187518e-06, "optim/total_tokens": 1994953588736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2638161182403564, "created_at": "2025-06-03T10:15:34.909041+00:00"} {"global_step": 237818, "acc_step": 0, "speed/wps": 5524.08894671115, "speed/FLOPS": 244136456594226.28, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04809817671775818, "optim/lr": 4.1963672867806335e-06, "optim/total_tokens": 1994961977344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.280104398727417, "created_at": "2025-06-03T10:15:37.882017+00:00"} {"global_step": 237819, "acc_step": 0, "speed/wps": 5507.191704112252, "speed/FLOPS": 243389684959282.97, "speed/curr_iter_time": 2.9739, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9739, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.98 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.98, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046509016305208206, "optim/lr": 4.192820061686309e-06, "optim/total_tokens": 1994970365952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2584441900253296, "created_at": "2025-06-03T10:15:40.861306+00:00"} {"global_step": 237820, "acc_step": 0, "speed/wps": 5534.251547074937, "speed/FLOPS": 244585591513401.56, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 195.51, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04771484434604645, "optim/lr": 4.189272836591762e-06, "optim/total_tokens": 1994978754560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2547589540481567, "created_at": "2025-06-03T10:15:43.825746+00:00"} {"global_step": 237821, "acc_step": 0, "speed/wps": 5517.64126896875, "speed/FLOPS": 243851502240218.62, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04633335396647453, "optim/lr": 4.185725611497215e-06, "optim/total_tokens": 1994987143168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2563501596450806, "created_at": "2025-06-03T10:15:46.799267+00:00"} {"global_step": 237822, "acc_step": 0, "speed/wps": 5517.742359425258, "speed/FLOPS": 243855969920968.4, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04788694530725479, "optim/lr": 4.182178386402669e-06, "optim/total_tokens": 1994995531776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2774732112884521, "created_at": "2025-06-03T10:15:49.776166+00:00"} {"global_step": 237823, "acc_step": 0, "speed/wps": 5524.69772874524, "speed/FLOPS": 244163361644104.16, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04708259180188179, "optim/lr": 4.178631161308344e-06, "optim/total_tokens": 1995003920384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2709052562713623, "created_at": "2025-06-03T10:15:52.748073+00:00"} {"global_step": 237824, "acc_step": 0, "speed/wps": 5511.183987587544, "speed/FLOPS": 243566123454531.6, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04725570231676102, "optim/lr": 4.175083936213797e-06, "optim/total_tokens": 1995012308992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2620209455490112, "created_at": "2025-06-03T10:15:55.726479+00:00"} {"global_step": 237825, "acc_step": 0, "speed/wps": 5511.571934018818, "speed/FLOPS": 243583268701104.06, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04716800898313522, "optim/lr": 4.17153671111925e-06, "optim/total_tokens": 1995020697600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2612807750701904, "created_at": "2025-06-03T10:15:58.708617+00:00"} {"global_step": 237826, "acc_step": 0, "speed/wps": 5503.615356886056, "speed/FLOPS": 243231628717289.62, "speed/curr_iter_time": 2.976, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.976, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 196.6, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04800746217370033, "optim/lr": 4.1679894860249256e-06, "optim/total_tokens": 1995029086208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2540735006332397, "created_at": "2025-06-03T10:16:01.689999+00:00"} {"global_step": 237827, "acc_step": 0, "speed/wps": 5516.686818570252, "speed/FLOPS": 243809320417925.03, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04702909663319588, "optim/lr": 4.164442260930379e-06, "optim/total_tokens": 1995037474816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2718753814697266, "created_at": "2025-06-03T10:16:04.665142+00:00"} {"global_step": 237828, "acc_step": 0, "speed/wps": 5516.087670692581, "speed/FLOPS": 243782841148448.8, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.97 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.97, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04935918375849724, "optim/lr": 4.160895035835832e-06, "optim/total_tokens": 1995045863424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2707570791244507, "created_at": "2025-06-03T10:16:07.643784+00:00"} {"global_step": 237829, "acc_step": 0, "speed/wps": 5522.439255969866, "speed/FLOPS": 244063548707344.22, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04659077152609825, "optim/lr": 4.1573478107412855e-06, "optim/total_tokens": 1995054252032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2672510147094727, "created_at": "2025-06-03T10:16:10.617640+00:00"} {"global_step": 237830, "acc_step": 0, "speed/wps": 5525.238100741911, "speed/FLOPS": 244187243320482.38, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04745526239275932, "optim/lr": 4.153800585646961e-06, "optim/total_tokens": 1995062640640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.25523042678833, "created_at": "2025-06-03T10:16:13.591351+00:00"} {"global_step": 237831, "acc_step": 0, "speed/wps": 5518.05721575833, "speed/FLOPS": 243869884959309.4, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047864146530628204, "optim/lr": 4.150253360552414e-06, "optim/total_tokens": 1995071029248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2662804126739502, "created_at": "2025-06-03T10:16:16.565064+00:00"} {"global_step": 237832, "acc_step": 0, "speed/wps": 5512.796677782561, "speed/FLOPS": 243637396106654.66, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047479547560214996, "optim/lr": 4.1467061354578674e-06, "optim/total_tokens": 1995079417856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.252034306526184, "created_at": "2025-06-03T10:16:19.541491+00:00"} {"global_step": 237833, "acc_step": 0, "speed/wps": 5523.576774665286, "speed/FLOPS": 244113821211333.3, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04670070484280586, "optim/lr": 4.14315891036332e-06, "optim/total_tokens": 1995087806464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2587954998016357, "created_at": "2025-06-03T10:16:22.515032+00:00"} {"global_step": 237834, "acc_step": 0, "speed/wps": 5511.376831232001, "speed/FLOPS": 243574646156553.34, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04789399355649948, "optim/lr": 4.139611685268996e-06, "optim/total_tokens": 1995096195072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2642794847488403, "created_at": "2025-06-03T10:16:25.497834+00:00"} {"global_step": 237835, "acc_step": 0, "speed/wps": 5512.277799084474, "speed/FLOPS": 243614464324061.16, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047779764980077744, "optim/lr": 4.136064460174449e-06, "optim/total_tokens": 1995104583680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2600691318511963, "created_at": "2025-06-03T10:16:28.474816+00:00"} {"global_step": 237836, "acc_step": 0, "speed/wps": 5534.992927139472, "speed/FLOPS": 244618356717526.84, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 195.49, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04652756080031395, "optim/lr": 4.132517235079902e-06, "optim/total_tokens": 1995112972288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2703579664230347, "created_at": "2025-06-03T10:16:31.439060+00:00"} {"global_step": 237837, "acc_step": 0, "speed/wps": 5527.94691801745, "speed/FLOPS": 244306959179077.5, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04637354239821434, "optim/lr": 4.128970009985356e-06, "optim/total_tokens": 1995121360896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2775299549102783, "created_at": "2025-06-03T10:16:34.409708+00:00"} {"global_step": 237838, "acc_step": 0, "speed/wps": 5537.500790961274, "speed/FLOPS": 244729191462039.8, "speed/curr_iter_time": 2.9562, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9562, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 195.3, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04653912037611008, "optim/lr": 4.125422784891031e-06, "optim/total_tokens": 1995129749504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2657740116119385, "created_at": "2025-06-03T10:16:37.376165+00:00"} {"global_step": 237839, "acc_step": 0, "speed/wps": 5518.9200874765875, "speed/FLOPS": 243908019472678.53, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04763076826930046, "optim/lr": 4.121875559796484e-06, "optim/total_tokens": 1995138138112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2689018249511719, "created_at": "2025-06-03T10:16:40.353443+00:00"} {"global_step": 237840, "acc_step": 0, "speed/wps": 5523.200375914234, "speed/FLOPS": 244097186313120.25, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047268956899642944, "optim/lr": 4.118328334701938e-06, "optim/total_tokens": 1995146526720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2772384881973267, "created_at": "2025-06-03T10:16:43.329065+00:00"} {"global_step": 237841, "acc_step": 0, "speed/wps": 5513.200689356059, "speed/FLOPS": 243655251350284.56, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04695337638258934, "optim/lr": 4.11478110960739e-06, "optim/total_tokens": 1995154915328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2681617736816406, "created_at": "2025-06-03T10:16:46.305292+00:00"} {"global_step": 237842, "acc_step": 0, "speed/wps": 5510.693318983354, "speed/FLOPS": 243544438413696.0, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.96 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.96, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04685935005545616, "optim/lr": 4.111233884513066e-06, "optim/total_tokens": 1995163303936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2632108926773071, "created_at": "2025-06-03T10:16:49.282444+00:00"} {"global_step": 237843, "acc_step": 0, "speed/wps": 5521.281313127638, "speed/FLOPS": 244012373560606.47, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04732467606663704, "optim/lr": 4.1076866594185195e-06, "optim/total_tokens": 1995171692544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.27242112159729, "created_at": "2025-06-03T10:16:52.257911+00:00"} {"global_step": 237844, "acc_step": 0, "speed/wps": 5530.83073814923, "speed/FLOPS": 244434409268172.62, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.049601614475250244, "optim/lr": 4.104139434323972e-06, "optim/total_tokens": 1995180081152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2738369703292847, "created_at": "2025-06-03T10:16:55.227729+00:00"} {"global_step": 237845, "acc_step": 0, "speed/wps": 5530.070353092985, "speed/FLOPS": 244400804140690.16, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04844030365347862, "optim/lr": 4.100592209229426e-06, "optim/total_tokens": 1995188469760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2694625854492188, "created_at": "2025-06-03T10:16:58.194754+00:00"} {"global_step": 237846, "acc_step": 0, "speed/wps": 5534.440011176865, "speed/FLOPS": 244593920662060.03, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04908789321780205, "optim/lr": 4.097044984135101e-06, "optim/total_tokens": 1995196858368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2467151880264282, "created_at": "2025-06-03T10:17:01.162528+00:00"} {"global_step": 237847, "acc_step": 0, "speed/wps": 5527.108023085596, "speed/FLOPS": 244269884316943.06, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047689151018857956, "optim/lr": 4.093497759040554e-06, "optim/total_tokens": 1995205246976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2534470558166504, "created_at": "2025-06-03T10:17:04.131255+00:00"} {"global_step": 237848, "acc_step": 0, "speed/wps": 5515.47779135344, "speed/FLOPS": 243755887603304.2, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04799922928214073, "optim/lr": 4.089950533946008e-06, "optim/total_tokens": 1995213635584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.279693603515625, "created_at": "2025-06-03T10:17:07.106532+00:00"} {"global_step": 237849, "acc_step": 0, "speed/wps": 5515.299273579862, "speed/FLOPS": 243747998031448.84, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04969055578112602, "optim/lr": 4.0864033088514605e-06, "optim/total_tokens": 1995222024192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2716249227523804, "created_at": "2025-06-03T10:17:10.083518+00:00"} {"global_step": 237850, "acc_step": 0, "speed/wps": 5516.5238076627575, "speed/FLOPS": 243802116170179.22, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04732687398791313, "optim/lr": 4.082856083757136e-06, "optim/total_tokens": 1995230412800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2504864931106567, "created_at": "2025-06-03T10:17:13.060584+00:00"} {"global_step": 237851, "acc_step": 0, "speed/wps": 5516.554211865643, "speed/FLOPS": 243803459880323.94, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.049783673137426376, "optim/lr": 4.07930885866259e-06, "optim/total_tokens": 1995238801408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2731566429138184, "created_at": "2025-06-03T10:17:16.035618+00:00"} {"global_step": 237852, "acc_step": 0, "speed/wps": 5517.111863903757, "speed/FLOPS": 243828105246086.7, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.051237016916275024, "optim/lr": 4.075761633568042e-06, "optim/total_tokens": 1995247190016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2556301355361938, "created_at": "2025-06-03T10:17:19.011177+00:00"} {"global_step": 237853, "acc_step": 0, "speed/wps": 5520.495781601003, "speed/FLOPS": 243977657087844.06, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.95 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.95, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04749372601509094, "optim/lr": 4.072214408473718e-06, "optim/total_tokens": 1995255578624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2581939697265625, "created_at": "2025-06-03T10:17:21.986815+00:00"} {"global_step": 237854, "acc_step": 0, "speed/wps": 5522.831697130017, "speed/FLOPS": 244080892597926.94, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047498106956481934, "optim/lr": 4.068667183379171e-06, "optim/total_tokens": 1995263967232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2675087451934814, "created_at": "2025-06-03T10:17:24.962970+00:00"} {"global_step": 237855, "acc_step": 0, "speed/wps": 5518.071791920435, "speed/FLOPS": 243870529151066.88, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.05156476050615311, "optim/lr": 4.065119958284624e-06, "optim/total_tokens": 1995272355840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2668042182922363, "created_at": "2025-06-03T10:17:27.936225+00:00"} {"global_step": 237856, "acc_step": 0, "speed/wps": 5525.956111521597, "speed/FLOPS": 244218975721832.22, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047851189970970154, "optim/lr": 4.061572733190078e-06, "optim/total_tokens": 1995280744448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.25432550907135, "created_at": "2025-06-03T10:17:30.905251+00:00"} {"global_step": 237857, "acc_step": 0, "speed/wps": 5525.742642077796, "speed/FLOPS": 244209541465051.8, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046355895698070526, "optim/lr": 4.0580255080957526e-06, "optim/total_tokens": 1995289133056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2658054828643799, "created_at": "2025-06-03T10:17:33.874736+00:00"} {"global_step": 237858, "acc_step": 0, "speed/wps": 5522.616023212074, "speed/FLOPS": 244071360914673.03, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047011926770210266, "optim/lr": 4.054478283001206e-06, "optim/total_tokens": 1995297521664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2629427909851074, "created_at": "2025-06-03T10:17:36.846827+00:00"} {"global_step": 237859, "acc_step": 0, "speed/wps": 5517.991581577657, "speed/FLOPS": 243866984264469.8, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04978116601705551, "optim/lr": 4.05093105790666e-06, "optim/total_tokens": 1995305910272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2507309913635254, "created_at": "2025-06-03T10:17:39.820809+00:00"} {"global_step": 237860, "acc_step": 0, "speed/wps": 5529.888270780357, "speed/FLOPS": 244392757034453.75, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04857613518834114, "optim/lr": 4.0473838328121125e-06, "optim/total_tokens": 1995314298880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2696561813354492, "created_at": "2025-06-03T10:17:42.791720+00:00"} {"global_step": 237861, "acc_step": 0, "speed/wps": 5524.106417311421, "speed/FLOPS": 244137228705335.62, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0465659461915493, "optim/lr": 4.043836607717788e-06, "optim/total_tokens": 1995322687488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2556419372558594, "created_at": "2025-06-03T10:17:45.767500+00:00"} {"global_step": 237862, "acc_step": 0, "speed/wps": 5521.180671705892, "speed/FLOPS": 244007925724894.78, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047446973621845245, "optim/lr": 4.040289382623241e-06, "optim/total_tokens": 1995331076096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2616838216781616, "created_at": "2025-06-03T10:17:48.740578+00:00"} {"global_step": 237863, "acc_step": 0, "speed/wps": 5528.248023362799, "speed/FLOPS": 244320266494145.06, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04811779409646988, "optim/lr": 4.0367421575286944e-06, "optim/total_tokens": 1995339464704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2712379693984985, "created_at": "2025-06-03T10:17:51.712098+00:00"} {"global_step": 237864, "acc_step": 0, "speed/wps": 5527.807848188465, "speed/FLOPS": 244300813004460.28, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047914471477270126, "optim/lr": 4.033194932434148e-06, "optim/total_tokens": 1995347853312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.269241452217102, "created_at": "2025-06-03T10:17:54.680511+00:00"} {"global_step": 237865, "acc_step": 0, "speed/wps": 5520.169122925127, "speed/FLOPS": 243963220446361.03, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046966541558504105, "optim/lr": 4.029647707339823e-06, "optim/total_tokens": 1995356241920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.255910038948059, "created_at": "2025-06-03T10:17:57.652372+00:00"} {"global_step": 237866, "acc_step": 0, "speed/wps": 5522.881737339374, "speed/FLOPS": 244083104119051.5, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04798438772559166, "optim/lr": 4.026100482245276e-06, "optim/total_tokens": 1995364630528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2635000944137573, "created_at": "2025-06-03T10:18:00.623471+00:00"} {"global_step": 237867, "acc_step": 0, "speed/wps": 5520.33670508876, "speed/FLOPS": 243970626720230.3, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.05072619765996933, "optim/lr": 4.02255325715073e-06, "optim/total_tokens": 1995373019136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2649214267730713, "created_at": "2025-06-03T10:18:03.595395+00:00"} {"global_step": 237868, "acc_step": 0, "speed/wps": 5505.389362128893, "speed/FLOPS": 243310030668841.0, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.94 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.94, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04792099818587303, "optim/lr": 4.019006032056183e-06, "optim/total_tokens": 1995381407744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2594163417816162, "created_at": "2025-06-03T10:18:06.580321+00:00"} {"global_step": 237869, "acc_step": 0, "speed/wps": 5517.385051290879, "speed/FLOPS": 243840178730297.7, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0477915033698082, "optim/lr": 4.015458806961858e-06, "optim/total_tokens": 1995389796352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2644137144088745, "created_at": "2025-06-03T10:18:09.554241+00:00"} {"global_step": 237870, "acc_step": 0, "speed/wps": 5541.053127606507, "speed/FLOPS": 244886186559251.84, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 195.31, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04821662977337837, "optim/lr": 4.011911581867311e-06, "optim/total_tokens": 1995398184960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.241985559463501, "created_at": "2025-06-03T10:18:12.515064+00:00"} {"global_step": 237871, "acc_step": 0, "speed/wps": 5539.009282825628, "speed/FLOPS": 244795859081282.97, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 195.38, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047573335468769073, "optim/lr": 4.0083643567727646e-06, "optim/total_tokens": 1995406573568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.270035982131958, "created_at": "2025-06-03T10:18:15.477055+00:00"} {"global_step": 237872, "acc_step": 0, "speed/wps": 5518.133324545044, "speed/FLOPS": 243873248578122.06, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04668351635336876, "optim/lr": 4.004817131678218e-06, "optim/total_tokens": 1995414962176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2656580209732056, "created_at": "2025-06-03T10:18:18.450690+00:00"} {"global_step": 237873, "acc_step": 0, "speed/wps": 5536.4094240134045, "speed/FLOPS": 244680958629066.4, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04680100455880165, "optim/lr": 4.001269906583893e-06, "optim/total_tokens": 1995423350784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.277034044265747, "created_at": "2025-06-03T10:18:21.419756+00:00"} {"global_step": 237874, "acc_step": 0, "speed/wps": 5515.232691334245, "speed/FLOPS": 243745055436991.4, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047463513910770416, "optim/lr": 3.9977226814893465e-06, "optim/total_tokens": 1995431739392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2729861736297607, "created_at": "2025-06-03T10:18:24.394976+00:00"} {"global_step": 237875, "acc_step": 0, "speed/wps": 5528.741771079602, "speed/FLOPS": 244342087615997.8, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04685194417834282, "optim/lr": 3.994175456394799e-06, "optim/total_tokens": 1995440128000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2519313097000122, "created_at": "2025-06-03T10:18:27.362974+00:00"} {"global_step": 237876, "acc_step": 0, "speed/wps": 5508.830276835668, "speed/FLOPS": 243462101486682.44, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04761428385972977, "optim/lr": 3.990628231300253e-06, "optim/total_tokens": 1995448516608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.251783847808838, "created_at": "2025-06-03T10:18:30.341777+00:00"} {"global_step": 237877, "acc_step": 0, "speed/wps": 5503.041706697858, "speed/FLOPS": 243206276315179.1, "speed/curr_iter_time": 2.9762, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9762, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.93 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.93, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04649290814995766, "optim/lr": 3.987081006205928e-06, "optim/total_tokens": 1995456905216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2538824081420898, "created_at": "2025-06-03T10:18:33.324758+00:00"} {"global_step": 237878, "acc_step": 0, "speed/wps": 5534.133077388048, "speed/FLOPS": 244580355759623.9, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.47, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04728846997022629, "optim/lr": 3.983533781111381e-06, "optim/total_tokens": 1995465293824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.268376111984253, "created_at": "2025-06-03T10:18:36.293049+00:00"} {"global_step": 237879, "acc_step": 0, "speed/wps": 5528.925335697761, "speed/FLOPS": 244350200232551.56, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048156023025512695, "optim/lr": 3.979986556016835e-06, "optim/total_tokens": 1995473682432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2680838108062744, "created_at": "2025-06-03T10:18:39.260424+00:00"} {"global_step": 237880, "acc_step": 0, "speed/wps": 5522.1229910922075, "speed/FLOPS": 244049571418542.1, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04926212131977081, "optim/lr": 3.97643933092251e-06, "optim/total_tokens": 1995482071040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2513476610183716, "created_at": "2025-06-03T10:18:42.236371+00:00"} {"global_step": 237881, "acc_step": 0, "speed/wps": 5524.60513859694, "speed/FLOPS": 244159269633468.66, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046869050711393356, "optim/lr": 3.972892105827963e-06, "optim/total_tokens": 1995490459648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.264788031578064, "created_at": "2025-06-03T10:18:45.207576+00:00"} {"global_step": 237882, "acc_step": 0, "speed/wps": 5530.516959161121, "speed/FLOPS": 244420541842964.7, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04661067575216293, "optim/lr": 3.969344880733417e-06, "optim/total_tokens": 1995498848256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2668330669403076, "created_at": "2025-06-03T10:18:48.179889+00:00"} {"global_step": 237883, "acc_step": 0, "speed/wps": 5522.355577678437, "speed/FLOPS": 244059850555167.38, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04728197678923607, "optim/lr": 3.965797655638869e-06, "optim/total_tokens": 1995507236864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.269152045249939, "created_at": "2025-06-03T10:18:51.153958+00:00"} {"global_step": 237884, "acc_step": 0, "speed/wps": 5514.151697666236, "speed/FLOPS": 243697281049892.6, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04666893184185028, "optim/lr": 3.962250430544545e-06, "optim/total_tokens": 1995515625472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2590957880020142, "created_at": "2025-06-03T10:18:54.129611+00:00"} {"global_step": 237885, "acc_step": 0, "speed/wps": 5500.454198920023, "speed/FLOPS": 243091921715464.22, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04870803281664848, "optim/lr": 3.9587032054499985e-06, "optim/total_tokens": 1995524014080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2534517049789429, "created_at": "2025-06-03T10:18:57.117739+00:00"} {"global_step": 237886, "acc_step": 0, "speed/wps": 5508.722600266773, "speed/FLOPS": 243457342733475.9, "speed/curr_iter_time": 2.9732, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9732, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047842301428318024, "optim/lr": 3.955155980355451e-06, "optim/total_tokens": 1995532402688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2660059928894043, "created_at": "2025-06-03T10:19:00.096600+00:00"} {"global_step": 237887, "acc_step": 0, "speed/wps": 5510.687545261171, "speed/FLOPS": 243544183244728.1, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04673674702644348, "optim/lr": 3.951608755260905e-06, "optim/total_tokens": 1995540791296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2679308652877808, "created_at": "2025-06-03T10:19:03.074219+00:00"} {"global_step": 237888, "acc_step": 0, "speed/wps": 5528.815329170809, "speed/FLOPS": 244345338507124.72, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048471599817276, "optim/lr": 3.94806153016658e-06, "optim/total_tokens": 1995549179904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2535597085952759, "created_at": "2025-06-03T10:19:06.043887+00:00"} {"global_step": 237889, "acc_step": 0, "speed/wps": 5519.832308275134, "speed/FLOPS": 243948334962804.97, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.92 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.92, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046897392719984055, "optim/lr": 3.944514305072033e-06, "optim/total_tokens": 1995557568512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.270585060119629, "created_at": "2025-06-03T10:19:09.017118+00:00"} {"global_step": 237890, "acc_step": 0, "speed/wps": 5526.161619636798, "speed/FLOPS": 244228058128638.16, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04698991775512695, "optim/lr": 3.940967079977487e-06, "optim/total_tokens": 1995565957120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.275094747543335, "created_at": "2025-06-03T10:19:11.990192+00:00"} {"global_step": 237891, "acc_step": 0, "speed/wps": 5519.491912390613, "speed/FLOPS": 243933291207013.22, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04932273551821709, "optim/lr": 3.9374198548829395e-06, "optim/total_tokens": 1995574345728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2682709693908691, "created_at": "2025-06-03T10:19:14.964110+00:00"} {"global_step": 237892, "acc_step": 0, "speed/wps": 5529.139315700845, "speed/FLOPS": 244359657053438.97, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047328490763902664, "optim/lr": 3.933872629788615e-06, "optim/total_tokens": 1995582734336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2441500425338745, "created_at": "2025-06-03T10:19:17.933066+00:00"} {"global_step": 237893, "acc_step": 0, "speed/wps": 5521.076473216658, "speed/FLOPS": 244003320685006.88, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04835471883416176, "optim/lr": 3.930325404694069e-06, "optim/total_tokens": 1995591122944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2555674314498901, "created_at": "2025-06-03T10:19:20.907290+00:00"} {"global_step": 237894, "acc_step": 0, "speed/wps": 5526.216550035923, "speed/FLOPS": 244230485771120.25, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.050398822873830795, "optim/lr": 3.926778179599521e-06, "optim/total_tokens": 1995599511552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2533891201019287, "created_at": "2025-06-03T10:19:23.876604+00:00"} {"global_step": 237895, "acc_step": 0, "speed/wps": 5521.471900263607, "speed/FLOPS": 244020796536502.9, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04700043052434921, "optim/lr": 3.923230954504975e-06, "optim/total_tokens": 1995607900160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.255110740661621, "created_at": "2025-06-03T10:19:26.848038+00:00"} {"global_step": 237896, "acc_step": 0, "speed/wps": 5527.257169032543, "speed/FLOPS": 244276475804399.97, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0472668781876564, "optim/lr": 3.9196837294106506e-06, "optim/total_tokens": 1995616288768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.261157751083374, "created_at": "2025-06-03T10:19:29.816152+00:00"} {"global_step": 237897, "acc_step": 0, "speed/wps": 5525.869348110218, "speed/FLOPS": 244215141223144.62, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04722113907337189, "optim/lr": 3.916136504316103e-06, "optim/total_tokens": 1995624677376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2524501085281372, "created_at": "2025-06-03T10:19:32.788850+00:00"} {"global_step": 237898, "acc_step": 0, "speed/wps": 5535.002358920882, "speed/FLOPS": 244618773553988.94, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04722015559673309, "optim/lr": 3.912589279221557e-06, "optim/total_tokens": 1995633065984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2702776193618774, "created_at": "2025-06-03T10:19:35.756442+00:00"} {"global_step": 237899, "acc_step": 0, "speed/wps": 5529.647803976147, "speed/FLOPS": 244382129632528.38, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046979211270809174, "optim/lr": 3.90904205412701e-06, "optim/total_tokens": 1995641454592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2717961072921753, "created_at": "2025-06-03T10:19:38.724868+00:00"} {"global_step": 237900, "acc_step": 0, "speed/wps": 5515.147415844093, "speed/FLOPS": 243741286696806.22, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04692044481635094, "optim/lr": 3.905494829032685e-06, "optim/total_tokens": 1995649843200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.259209156036377, "created_at": "2025-06-03T10:19:41.699954+00:00"} {"global_step": 237901, "acc_step": 0, "speed/wps": 5519.0838495112675, "speed/FLOPS": 243915256916401.3, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.91 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.91, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04831220582127571, "optim/lr": 3.901947603938139e-06, "optim/total_tokens": 1995658231808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2529714107513428, "created_at": "2025-06-03T10:19:44.676381+00:00"} {"global_step": 237902, "acc_step": 0, "speed/wps": 5526.901948406144, "speed/FLOPS": 244260776870897.1, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046756312251091, "optim/lr": 3.8984003788435916e-06, "optim/total_tokens": 1995666620416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2673264741897583, "created_at": "2025-06-03T10:19:47.647671+00:00"} {"global_step": 237903, "acc_step": 0, "speed/wps": 5520.82308186975, "speed/FLOPS": 243992122084448.03, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04880787059664726, "optim/lr": 3.894853153749045e-06, "optim/total_tokens": 1995675009024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.257559061050415, "created_at": "2025-06-03T10:19:50.620635+00:00"} {"global_step": 237904, "acc_step": 0, "speed/wps": 5525.055940000246, "speed/FLOPS": 244179192748084.0, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.061915308237075806, "optim/lr": 3.891305928654721e-06, "optim/total_tokens": 1995683397632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2635371685028076, "created_at": "2025-06-03T10:19:53.591213+00:00"} {"global_step": 237905, "acc_step": 0, "speed/wps": 5518.064469213211, "speed/FLOPS": 243870205524888.56, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04694441705942154, "optim/lr": 3.8877587035601735e-06, "optim/total_tokens": 1995691786240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2733609676361084, "created_at": "2025-06-03T10:19:56.564445+00:00"} {"global_step": 237906, "acc_step": 0, "speed/wps": 5533.532379038385, "speed/FLOPS": 244553807967221.7, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 195.6, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04696165770292282, "optim/lr": 3.884211478465627e-06, "optim/total_tokens": 1995700174848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2729026079177856, "created_at": "2025-06-03T10:19:59.529980+00:00"} {"global_step": 237907, "acc_step": 0, "speed/wps": 5524.402927860948, "speed/FLOPS": 244150332953946.16, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047040171921253204, "optim/lr": 3.880664253371302e-06, "optim/total_tokens": 1995708563456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.269392967224121, "created_at": "2025-06-03T10:20:02.499658+00:00"} {"global_step": 237908, "acc_step": 0, "speed/wps": 5514.71306053747, "speed/FLOPS": 243722090415485.47, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.049640756100416183, "optim/lr": 3.877117028276755e-06, "optim/total_tokens": 1995716952064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2615976333618164, "created_at": "2025-06-03T10:20:05.479153+00:00"} {"global_step": 237909, "acc_step": 0, "speed/wps": 5510.764875907125, "speed/FLOPS": 243547600863465.16, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04957932233810425, "optim/lr": 3.873569803182209e-06, "optim/total_tokens": 1995725340672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2625724077224731, "created_at": "2025-06-03T10:20:08.458597+00:00"} {"global_step": 237910, "acc_step": 0, "speed/wps": 5506.862638107468, "speed/FLOPS": 243375141926184.0, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04929964616894722, "optim/lr": 3.870022578087662e-06, "optim/total_tokens": 1995733729280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2555087804794312, "created_at": "2025-06-03T10:20:11.442167+00:00"} {"global_step": 237911, "acc_step": 0, "speed/wps": 5508.60465698326, "speed/FLOPS": 243452130244033.06, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047177754342556, "optim/lr": 3.866475352993337e-06, "optim/total_tokens": 1995742117888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.257662296295166, "created_at": "2025-06-03T10:20:14.425007+00:00"} {"global_step": 237912, "acc_step": 0, "speed/wps": 5510.811939522823, "speed/FLOPS": 243549680834385.56, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04775851592421532, "optim/lr": 3.862928127898791e-06, "optim/total_tokens": 1995750506496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.251935601234436, "created_at": "2025-06-03T10:20:17.406773+00:00"} {"global_step": 237913, "acc_step": 0, "speed/wps": 5513.369345461087, "speed/FLOPS": 243662705086866.6, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.9 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.9, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04794401675462723, "optim/lr": 3.859380902804244e-06, "optim/total_tokens": 1995758895104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2551764249801636, "created_at": "2025-06-03T10:20:20.382979+00:00"} {"global_step": 237914, "acc_step": 0, "speed/wps": 5520.886638902895, "speed/FLOPS": 243994930979998.66, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04745228961110115, "optim/lr": 3.855833677709697e-06, "optim/total_tokens": 1995767283712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.277127981185913, "created_at": "2025-06-03T10:20:23.354802+00:00"} {"global_step": 237915, "acc_step": 0, "speed/wps": 5516.858312985115, "speed/FLOPS": 243816899593273.97, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04630877450108528, "optim/lr": 3.852286452615372e-06, "optim/total_tokens": 1995775672320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.263126015663147, "created_at": "2025-06-03T10:20:26.331902+00:00"} {"global_step": 237916, "acc_step": 0, "speed/wps": 5518.923928077621, "speed/FLOPS": 243908189207586.25, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04726845771074295, "optim/lr": 3.8487392275208255e-06, "optim/total_tokens": 1995784060928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2503191232681274, "created_at": "2025-06-03T10:20:29.306487+00:00"} {"global_step": 237917, "acc_step": 0, "speed/wps": 5520.642261118284, "speed/FLOPS": 243984130732757.75, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04791700839996338, "optim/lr": 3.845192002426279e-06, "optim/total_tokens": 1995792449536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2631182670593262, "created_at": "2025-06-03T10:20:32.278580+00:00"} {"global_step": 237918, "acc_step": 0, "speed/wps": 5519.661835568867, "speed/FLOPS": 243940800941746.38, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04687894508242607, "optim/lr": 3.841644777331732e-06, "optim/total_tokens": 1995800838144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2565901279449463, "created_at": "2025-06-03T10:20:35.252063+00:00"} {"global_step": 237919, "acc_step": 0, "speed/wps": 5515.998299603645, "speed/FLOPS": 243778891403760.53, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04693802073597908, "optim/lr": 3.838097552237407e-06, "optim/total_tokens": 1995809226752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2485411167144775, "created_at": "2025-06-03T10:20:38.226527+00:00"} {"global_step": 237920, "acc_step": 0, "speed/wps": 5529.610249506756, "speed/FLOPS": 244380469917202.5, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0468214675784111, "optim/lr": 3.83455032714286e-06, "optim/total_tokens": 1995817615360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.262520670890808, "created_at": "2025-06-03T10:20:41.197626+00:00"} {"global_step": 237921, "acc_step": 0, "speed/wps": 5526.091393397929, "speed/FLOPS": 244224954488330.66, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048077717423439026, "optim/lr": 3.831003102048314e-06, "optim/total_tokens": 1995826003968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2628862857818604, "created_at": "2025-06-03T10:20:44.171160+00:00"} {"global_step": 237922, "acc_step": 0, "speed/wps": 5517.978167620529, "speed/FLOPS": 243866391436223.66, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04692555591464043, "optim/lr": 3.827455876953767e-06, "optim/total_tokens": 1995834392576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2478729486465454, "created_at": "2025-06-03T10:20:47.144073+00:00"} {"global_step": 237923, "acc_step": 0, "speed/wps": 5526.491551313303, "speed/FLOPS": 244242639419996.28, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04706528037786484, "optim/lr": 3.823908651859442e-06, "optim/total_tokens": 1995842781184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2502974271774292, "created_at": "2025-06-03T10:20:50.113137+00:00"} {"global_step": 237924, "acc_step": 0, "speed/wps": 5521.862196019369, "speed/FLOPS": 244038045611192.8, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04671026021242142, "optim/lr": 3.820361426764896e-06, "optim/total_tokens": 1995851169792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2541190385818481, "created_at": "2025-06-03T10:20:53.084278+00:00"} {"global_step": 237925, "acc_step": 0, "speed/wps": 5515.667757112532, "speed/FLOPS": 243764283117523.16, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.048707082867622375, "optim/lr": 3.816814201670349e-06, "optim/total_tokens": 1995859558400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2505130767822266, "created_at": "2025-06-03T10:20:56.062642+00:00"} {"global_step": 237926, "acc_step": 0, "speed/wps": 5512.752078650976, "speed/FLOPS": 243635425053317.62, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0469934307038784, "optim/lr": 3.813266976575802e-06, "optim/total_tokens": 1995867947008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.264034628868103, "created_at": "2025-06-03T10:20:59.038750+00:00"} {"global_step": 237927, "acc_step": 0, "speed/wps": 5513.827600442803, "speed/FLOPS": 243682957611496.8, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.89 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.89, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04830654338002205, "optim/lr": 3.8097197514814776e-06, "optim/total_tokens": 1995876335616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.252187967300415, "created_at": "2025-06-03T10:21:02.014726+00:00"} {"global_step": 237928, "acc_step": 0, "speed/wps": 5534.453325953725, "speed/FLOPS": 244594509107046.06, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046678632497787476, "optim/lr": 3.8061725263869307e-06, "optim/total_tokens": 1995884724224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2572429180145264, "created_at": "2025-06-03T10:21:04.979402+00:00"} {"global_step": 237929, "acc_step": 0, "speed/wps": 5525.405683215186, "speed/FLOPS": 244194649608036.3, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04699089005589485, "optim/lr": 3.802625301292384e-06, "optim/total_tokens": 1995893112832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2543275356292725, "created_at": "2025-06-03T10:21:07.949037+00:00"} {"global_step": 237930, "acc_step": 0, "speed/wps": 5539.194977499282, "speed/FLOPS": 244804065835386.94, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 195.43, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04989755526185036, "optim/lr": 3.799078076197837e-06, "optim/total_tokens": 1995901501440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2490237951278687, "created_at": "2025-06-03T10:21:10.915333+00:00"} {"global_step": 237931, "acc_step": 0, "speed/wps": 5510.515716644792, "speed/FLOPS": 243536589299382.72, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04628791660070419, "optim/lr": 3.7955308511035126e-06, "optim/total_tokens": 1995909890048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2517688274383545, "created_at": "2025-06-03T10:21:13.893777+00:00"} {"global_step": 237932, "acc_step": 0, "speed/wps": 5539.368325942388, "speed/FLOPS": 244811726949294.47, "speed/curr_iter_time": 2.9555, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9555, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04639822244644165, "optim/lr": 3.791983626008966e-06, "optim/total_tokens": 1995918278656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2739866971969604, "created_at": "2025-06-03T10:21:16.855512+00:00"} {"global_step": 237933, "acc_step": 0, "speed/wps": 5529.439403467466, "speed/FLOPS": 244372919396735.16, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 195.77, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04668709263205528, "optim/lr": 3.788436400914419e-06, "optim/total_tokens": 1995926667264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2617970705032349, "created_at": "2025-06-03T10:21:19.824686+00:00"} {"global_step": 237934, "acc_step": 0, "speed/wps": 5515.129542819477, "speed/FLOPS": 243740496800600.62, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046923693269491196, "optim/lr": 3.784889175820094e-06, "optim/total_tokens": 1995935055872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2651039361953735, "created_at": "2025-06-03T10:21:22.799802+00:00"} {"global_step": 237935, "acc_step": 0, "speed/wps": 5516.606276987136, "speed/FLOPS": 243805760892200.47, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.049091096967458725, "optim/lr": 3.7813419507255477e-06, "optim/total_tokens": 1995943444480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2440052032470703, "created_at": "2025-06-03T10:21:25.774128+00:00"} {"global_step": 237936, "acc_step": 0, "speed/wps": 5529.802341595107, "speed/FLOPS": 244388959404291.12, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.88 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.88, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04812365770339966, "optim/lr": 3.777794725631001e-06, "optim/total_tokens": 1995951833088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2596768140792847, "created_at": "2025-06-03T10:21:28.741395+00:00"} {"global_step": 237937, "acc_step": 0, "speed/wps": 5539.693531740021, "speed/FLOPS": 244826099380995.7, "speed/curr_iter_time": 2.9566, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9566, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047000885009765625, "optim/lr": 3.774247500536454e-06, "optim/total_tokens": 1995960221696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.242264747619629, "created_at": "2025-06-03T10:21:31.705741+00:00"} {"global_step": 237938, "acc_step": 0, "speed/wps": 5531.9527543301165, "speed/FLOPS": 244483996640368.4, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.69, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04864652082324028, "optim/lr": 3.770700275442129e-06, "optim/total_tokens": 1995968610304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2599469423294067, "created_at": "2025-06-03T10:21:34.675605+00:00"} {"global_step": 237939, "acc_step": 0, "speed/wps": 5529.999775418749, "speed/FLOPS": 244397684968738.22, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.051069196313619614, "optim/lr": 3.7671530503475828e-06, "optim/total_tokens": 1995976998912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2735800743103027, "created_at": "2025-06-03T10:21:37.646472+00:00"} {"global_step": 237940, "acc_step": 0, "speed/wps": 5520.02582129066, "speed/FLOPS": 243956887247601.84, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04705885425209999, "optim/lr": 3.763605825253036e-06, "optim/total_tokens": 1995985387520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2696291208267212, "created_at": "2025-06-03T10:21:40.621219+00:00"} {"global_step": 237941, "acc_step": 0, "speed/wps": 5524.471056696357, "speed/FLOPS": 244153343899756.22, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04680319130420685, "optim/lr": 3.760058600158489e-06, "optim/total_tokens": 1995993776128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2664963006973267, "created_at": "2025-06-03T10:21:43.594388+00:00"} {"global_step": 237942, "acc_step": 0, "speed/wps": 5523.228787180439, "speed/FLOPS": 244098441945664.47, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04654410481452942, "optim/lr": 3.7565113750641643e-06, "optim/total_tokens": 1996002164736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2795108556747437, "created_at": "2025-06-03T10:21:46.565221+00:00"} {"global_step": 237943, "acc_step": 0, "speed/wps": 5511.009619976036, "speed/FLOPS": 243558417298597.3, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04725034907460213, "optim/lr": 3.752964149969618e-06, "optim/total_tokens": 1996010553344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.259840488433838, "created_at": "2025-06-03T10:21:49.546543+00:00"} {"global_step": 237944, "acc_step": 0, "speed/wps": 5519.5256811932495, "speed/FLOPS": 243934783615245.38, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.050898097455501556, "optim/lr": 3.749416924875071e-06, "optim/total_tokens": 1996018941952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.251064419746399, "created_at": "2025-06-03T10:21:52.523945+00:00"} {"global_step": 237945, "acc_step": 0, "speed/wps": 5526.908466334283, "speed/FLOPS": 244261064929959.06, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04681803658604622, "optim/lr": 3.7458696997805242e-06, "optim/total_tokens": 1996027330560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2751221656799316, "created_at": "2025-06-03T10:21:55.492708+00:00"} {"global_step": 237946, "acc_step": 0, "speed/wps": 5529.642632694515, "speed/FLOPS": 244381901088349.25, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047438591718673706, "optim/lr": 3.7423224746861993e-06, "optim/total_tokens": 1996035719168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2697025537490845, "created_at": "2025-06-03T10:21:58.460346+00:00"} {"global_step": 237947, "acc_step": 0, "speed/wps": 5523.95891223023, "speed/FLOPS": 244130709735746.47, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04835103452205658, "optim/lr": 3.7387752495916525e-06, "optim/total_tokens": 1996044107776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2729315757751465, "created_at": "2025-06-03T10:22:01.430337+00:00"} {"global_step": 237948, "acc_step": 0, "speed/wps": 5530.620741872831, "speed/FLOPS": 244425128507614.2, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04726403206586838, "optim/lr": 3.735228024497106e-06, "optim/total_tokens": 1996052496384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2635339498519897, "created_at": "2025-06-03T10:22:04.396969+00:00"} {"global_step": 237949, "acc_step": 0, "speed/wps": 5519.9688341425035, "speed/FLOPS": 243954368707339.97, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04695191979408264, "optim/lr": 3.7316807994025593e-06, "optim/total_tokens": 1996060884992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2680050134658813, "created_at": "2025-06-03T10:22:07.369493+00:00"} {"global_step": 237950, "acc_step": 0, "speed/wps": 5525.788307337936, "speed/FLOPS": 244211559635814.06, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04759970307350159, "optim/lr": 3.7281335743082344e-06, "optim/total_tokens": 1996069273600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2634222507476807, "created_at": "2025-06-03T10:22:10.338905+00:00"} {"global_step": 237951, "acc_step": 0, "speed/wps": 5516.4754368512595, "speed/FLOPS": 243799978427895.25, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.87 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.87, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04756704717874527, "optim/lr": 3.7245863492136876e-06, "optim/total_tokens": 1996077662208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2490200996398926, "created_at": "2025-06-03T10:22:13.312871+00:00"} {"global_step": 237952, "acc_step": 0, "speed/wps": 5515.534314022722, "speed/FLOPS": 243758385615977.25, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04758748412132263, "optim/lr": 3.721039124119141e-06, "optim/total_tokens": 1996086050816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2662718296051025, "created_at": "2025-06-03T10:22:16.287754+00:00"} {"global_step": 237953, "acc_step": 0, "speed/wps": 5506.1004351554775, "speed/FLOPS": 243341456457014.38, "speed/curr_iter_time": 2.9733, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9733, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046584729105234146, "optim/lr": 3.7174918990245944e-06, "optim/total_tokens": 1996094439424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2632874250411987, "created_at": "2025-06-03T10:22:19.273153+00:00"} {"global_step": 237954, "acc_step": 0, "speed/wps": 5523.4612718289845, "speed/FLOPS": 244108716577165.88, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04764282703399658, "optim/lr": 3.7139446739302695e-06, "optim/total_tokens": 1996102828032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2494159936904907, "created_at": "2025-06-03T10:22:22.247716+00:00"} {"global_step": 237955, "acc_step": 0, "speed/wps": 5526.2097798582845, "speed/FLOPS": 244230186563921.53, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 195.9, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.0465010330080986, "optim/lr": 3.7103974488357227e-06, "optim/total_tokens": 1996111216640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2653651237487793, "created_at": "2025-06-03T10:22:25.217563+00:00"} {"global_step": 237956, "acc_step": 0, "speed/wps": 5519.024556066818, "speed/FLOPS": 243912636449648.03, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04613661393523216, "optim/lr": 3.7068502237411763e-06, "optim/total_tokens": 1996119605248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2579319477081299, "created_at": "2025-06-03T10:22:28.192687+00:00"} {"global_step": 237957, "acc_step": 0, "speed/wps": 5527.08733183497, "speed/FLOPS": 244268969869572.84, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046545639634132385, "optim/lr": 3.7033029986466294e-06, "optim/total_tokens": 1996127993856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2469490766525269, "created_at": "2025-06-03T10:22:31.165404+00:00"} {"global_step": 237958, "acc_step": 0, "speed/wps": 5526.298225724579, "speed/FLOPS": 244234095418504.78, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047360360622406006, "optim/lr": 3.6997557735523046e-06, "optim/total_tokens": 1996136382464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2407118082046509, "created_at": "2025-06-03T10:22:34.134444+00:00"} {"global_step": 237959, "acc_step": 0, "speed/wps": 5522.708421868866, "speed/FLOPS": 244075444462364.03, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04794502630829811, "optim/lr": 3.6962085484577577e-06, "optim/total_tokens": 1996144771072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2670704126358032, "created_at": "2025-06-03T10:22:37.105925+00:00"} {"global_step": 237960, "acc_step": 0, "speed/wps": 5517.396990651596, "speed/FLOPS": 243840706388930.2, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.86 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.86, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04629407078027725, "optim/lr": 3.6926613233632113e-06, "optim/total_tokens": 1996153159680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2560789585113525, "created_at": "2025-06-03T10:22:40.079820+00:00"} {"global_step": 237961, "acc_step": 0, "speed/wps": 5531.37890083037, "speed/FLOPS": 244458635252928.1, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047306351363658905, "optim/lr": 3.6891140982688864e-06, "optim/total_tokens": 1996161548288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2418969869613647, "created_at": "2025-06-03T10:22:43.050635+00:00"} {"global_step": 237962, "acc_step": 0, "speed/wps": 5528.959214815637, "speed/FLOPS": 244351697516152.66, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04770016670227051, "optim/lr": 3.6855668731743396e-06, "optim/total_tokens": 1996169936896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.267057180404663, "created_at": "2025-06-03T10:22:46.018286+00:00"} {"global_step": 237963, "acc_step": 0, "speed/wps": 5526.277199849877, "speed/FLOPS": 244233166182463.12, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04697008058428764, "optim/lr": 3.682019648079793e-06, "optim/total_tokens": 1996178325504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2593340873718262, "created_at": "2025-06-03T10:22:48.987009+00:00"} {"global_step": 237964, "acc_step": 0, "speed/wps": 5533.2377392746275, "speed/FLOPS": 244540786397766.62, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04692627489566803, "optim/lr": 3.678472422985246e-06, "optim/total_tokens": 1996186714112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2632182836532593, "created_at": "2025-06-03T10:22:51.952460+00:00"} {"global_step": 237965, "acc_step": 0, "speed/wps": 5519.261851773246, "speed/FLOPS": 243923123705282.6, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04663128778338432, "optim/lr": 3.6749251978909215e-06, "optim/total_tokens": 1996195102720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2706847190856934, "created_at": "2025-06-03T10:22:54.925124+00:00"} {"global_step": 237966, "acc_step": 0, "speed/wps": 5538.789675472722, "speed/FLOPS": 244786153560336.8, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.39, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046991199254989624, "optim/lr": 3.6713779727963747e-06, "optim/total_tokens": 1996203491328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.261542558670044, "created_at": "2025-06-03T10:22:57.888211+00:00"} {"global_step": 237967, "acc_step": 0, "speed/wps": 5517.905390002626, "speed/FLOPS": 243863175038021.9, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047451697289943695, "optim/lr": 3.667830747701828e-06, "optim/total_tokens": 1996211879936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2781403064727783, "created_at": "2025-06-03T10:23:00.861424+00:00"} {"global_step": 237968, "acc_step": 0, "speed/wps": 5516.6561525490715, "speed/FLOPS": 243807965136751.75, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04722404107451439, "optim/lr": 3.664283522607281e-06, "optim/total_tokens": 1996220268544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2530242204666138, "created_at": "2025-06-03T10:23:03.835861+00:00"} {"global_step": 237969, "acc_step": 0, "speed/wps": 5513.01606524364, "speed/FLOPS": 243647091909507.5, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047278035432100296, "optim/lr": 3.6607362975129566e-06, "optim/total_tokens": 1996228657152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2673099040985107, "created_at": "2025-06-03T10:23:06.811845+00:00"} {"global_step": 237970, "acc_step": 0, "speed/wps": 5532.856076585547, "speed/FLOPS": 244523918860436.0, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04766825959086418, "optim/lr": 3.6571890724184098e-06, "optim/total_tokens": 1996237045760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2733930349349976, "created_at": "2025-06-03T10:23:09.779526+00:00"} {"global_step": 237971, "acc_step": 0, "speed/wps": 5525.415714051829, "speed/FLOPS": 244195092919673.44, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046957943588495255, "optim/lr": 3.653641847323863e-06, "optim/total_tokens": 1996245434368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2449241876602173, "created_at": "2025-06-03T10:23:12.749402+00:00"} {"global_step": 237972, "acc_step": 0, "speed/wps": 5528.93369466295, "speed/FLOPS": 244350569656027.88, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04762759804725647, "optim/lr": 3.650094622229316e-06, "optim/total_tokens": 1996253822976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2780632972717285, "created_at": "2025-06-03T10:23:15.721157+00:00"} {"global_step": 237973, "acc_step": 0, "speed/wps": 5525.329142883267, "speed/FLOPS": 244191266917134.4, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.85 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.85, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04699266701936722, "optim/lr": 3.6465473971349917e-06, "optim/total_tokens": 1996262211584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2605090141296387, "created_at": "2025-06-03T10:23:18.690834+00:00"} {"global_step": 237974, "acc_step": 0, "speed/wps": 5526.386180515288, "speed/FLOPS": 244237982570060.7, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046547453850507736, "optim/lr": 3.643000172040445e-06, "optim/total_tokens": 1996270600192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.261794090270996, "created_at": "2025-06-03T10:23:21.661994+00:00"} {"global_step": 237975, "acc_step": 0, "speed/wps": 5530.609730624166, "speed/FLOPS": 244424641866783.9, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.049043476581573486, "optim/lr": 3.639452946945898e-06, "optim/total_tokens": 1996278988800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2554858922958374, "created_at": "2025-06-03T10:23:24.628250+00:00"} {"global_step": 237976, "acc_step": 0, "speed/wps": 5520.137428698871, "speed/FLOPS": 243961819723786.25, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04679388552904129, "optim/lr": 3.6359057218513512e-06, "optim/total_tokens": 1996287377408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2633239030838013, "created_at": "2025-06-03T10:23:27.600266+00:00"} {"global_step": 237977, "acc_step": 0, "speed/wps": 5518.463220051895, "speed/FLOPS": 243887828270966.62, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.04702577739953995, "optim/lr": 3.6323584967570267e-06, "optim/total_tokens": 1996295766016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2519372701644897, "created_at": "2025-06-03T10:23:30.573415+00:00"} {"global_step": 237978, "acc_step": 0, "speed/wps": 5532.907235250708, "speed/FLOPS": 244526179811582.34, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.047492071986198425, "optim/lr": 3.62881127166248e-06, "optim/total_tokens": 1996304154624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2513704299926758, "created_at": "2025-06-03T10:23:33.538787+00:00"} {"global_step": 237979, "acc_step": 0, "speed/wps": 5534.954450645634, "speed/FLOPS": 244616656253439.75, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 195.52, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046754952520132065, "optim/lr": 3.625264046567933e-06, "optim/total_tokens": 1996312543232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2654927968978882, "created_at": "2025-06-03T10:23:36.502908+00:00"} {"global_step": 237980, "acc_step": 0, "speed/wps": 5534.2321150070175, "speed/FLOPS": 244584732715461.88, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046693503856658936, "optim/lr": 3.6217168214733863e-06, "optim/total_tokens": 1996320931840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2715051174163818, "created_at": "2025-06-03T10:23:39.472958+00:00"} {"global_step": 237981, "acc_step": 0, "speed/wps": 5523.335344712868, "speed/FLOPS": 244103151243186.94, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04792996868491173, "optim/lr": 3.618169596379062e-06, "optim/total_tokens": 1996329320448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2497912645339966, "created_at": "2025-06-03T10:23:42.449019+00:00"} {"global_step": 237982, "acc_step": 0, "speed/wps": 5511.560305632021, "speed/FLOPS": 243582754785927.1, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.04, "optim/grad_norm": 0.046606115996837616, "optim/lr": 3.614622371284515e-06, "optim/total_tokens": 1996337709056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2466298341751099, "created_at": "2025-06-03T10:23:45.426955+00:00"} {"global_step": 237983, "acc_step": 0, "speed/wps": 5520.654657654783, "speed/FLOPS": 243984678596219.75, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04686535894870758, "optim/lr": 3.611075146189968e-06, "optim/total_tokens": 1996346097664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2637269496917725, "created_at": "2025-06-03T10:23:48.398686+00:00"} {"global_step": 237984, "acc_step": 0, "speed/wps": 5536.898577574326, "speed/FLOPS": 244702576712744.25, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04681699350476265, "optim/lr": 3.6075279210954214e-06, "optim/total_tokens": 1996354486272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.25495445728302, "created_at": "2025-06-03T10:23:51.364713+00:00"} {"global_step": 237985, "acc_step": 0, "speed/wps": 5517.214194615904, "speed/FLOPS": 243832627739787.5, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.84 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.84, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04684494063258171, "optim/lr": 3.603980696001097e-06, "optim/total_tokens": 1996362874880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2725627422332764, "created_at": "2025-06-03T10:23:54.340111+00:00"} {"global_step": 237986, "acc_step": 0, "speed/wps": 5534.795298571559, "speed/FLOPS": 244609622546379.8, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 195.53, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047311313450336456, "optim/lr": 3.60043347090655e-06, "optim/total_tokens": 1996371263488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2518707513809204, "created_at": "2025-06-03T10:23:57.305808+00:00"} {"global_step": 237987, "acc_step": 0, "speed/wps": 5520.383508796761, "speed/FLOPS": 243972695204560.88, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04706304892897606, "optim/lr": 3.5968862458120033e-06, "optim/total_tokens": 1996379652096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2778851985931396, "created_at": "2025-06-03T10:24:00.281434+00:00"} {"global_step": 237988, "acc_step": 0, "speed/wps": 5535.111605184866, "speed/FLOPS": 244623601679683.94, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 195.61, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04640214517712593, "optim/lr": 3.593339020717679e-06, "optim/total_tokens": 1996388040704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2504181861877441, "created_at": "2025-06-03T10:24:03.245563+00:00"} {"global_step": 237989, "acc_step": 0, "speed/wps": 5519.338856144158, "speed/FLOPS": 243926526904332.8, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047044433653354645, "optim/lr": 3.589791795623132e-06, "optim/total_tokens": 1996396429312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2789924144744873, "created_at": "2025-06-03T10:24:06.220010+00:00"} {"global_step": 237990, "acc_step": 0, "speed/wps": 5522.4371639816745, "speed/FLOPS": 244063456252173.9, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04940023273229599, "optim/lr": 3.586244570528585e-06, "optim/total_tokens": 1996404817920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2714022397994995, "created_at": "2025-06-03T10:24:09.191123+00:00"} {"global_step": 237991, "acc_step": 0, "speed/wps": 5523.317478406731, "speed/FLOPS": 244102361643903.72, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04708600789308548, "optim/lr": 3.5826973454340383e-06, "optim/total_tokens": 1996413206528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.258867621421814, "created_at": "2025-06-03T10:24:12.161604+00:00"} {"global_step": 237992, "acc_step": 0, "speed/wps": 5521.443533063408, "speed/FLOPS": 244019542851450.6, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048051994293928146, "optim/lr": 3.5791501203397134e-06, "optim/total_tokens": 1996421595136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2578140497207642, "created_at": "2025-06-03T10:24:15.135941+00:00"} {"global_step": 237993, "acc_step": 0, "speed/wps": 5526.1174953115315, "speed/FLOPS": 244226108059310.16, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048281241208314896, "optim/lr": 3.575602895245167e-06, "optim/total_tokens": 1996429983744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.262751579284668, "created_at": "2025-06-03T10:24:18.108372+00:00"} {"global_step": 237994, "acc_step": 0, "speed/wps": 5515.904469367944, "speed/FLOPS": 243774744587609.25, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047859832644462585, "optim/lr": 3.5720556701506202e-06, "optim/total_tokens": 1996438372352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2637929916381836, "created_at": "2025-06-03T10:24:21.082878+00:00"} {"global_step": 237995, "acc_step": 0, "speed/wps": 5532.700886689597, "speed/FLOPS": 244517060261368.88, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04687456041574478, "optim/lr": 3.5685084450560734e-06, "optim/total_tokens": 1996446760960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2741574048995972, "created_at": "2025-06-03T10:24:24.048711+00:00"} {"global_step": 237996, "acc_step": 0, "speed/wps": 5532.300817724174, "speed/FLOPS": 244499379260835.78, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0467788502573967, "optim/lr": 3.5649612199617485e-06, "optim/total_tokens": 1996455149568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2690821886062622, "created_at": "2025-06-03T10:24:27.016152+00:00"} {"global_step": 237997, "acc_step": 0, "speed/wps": 5517.694023053802, "speed/FLOPS": 243853833700758.03, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0471719466149807, "optim/lr": 3.561413994867202e-06, "optim/total_tokens": 1996463538176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.270504355430603, "created_at": "2025-06-03T10:24:29.990019+00:00"} {"global_step": 237998, "acc_step": 0, "speed/wps": 5519.531339672778, "speed/FLOPS": 243935033691077.78, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.83 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.83, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047699250280857086, "optim/lr": 3.5578667697726553e-06, "optim/total_tokens": 1996471926784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2678860425949097, "created_at": "2025-06-03T10:24:32.962869+00:00"} {"global_step": 237999, "acc_step": 0, "speed/wps": 5531.786566988373, "speed/FLOPS": 244476652010487.28, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.82 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.82, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04835880920290947, "optim/lr": 3.5543195446781085e-06, "optim/total_tokens": 1996480315392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2592486143112183, "created_at": "2025-06-03T10:24:35.929340+00:00"} {"global_step": 238000, "acc_step": 0, "speed/wps": 5527.948794447337, "speed/FLOPS": 244307042107674.06, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.82 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.82, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04610853269696236, "optim/lr": 3.5507723195837836e-06, "optim/total_tokens": 1996488704000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.256993055343628, "created_at": "2025-06-03T10:24:38.898135+00:00"} {"global_step": 238001, "acc_step": 0, "speed/wps": 225.5882367158724, "speed/FLOPS": 9969845397573.105, "speed/curr_iter_time": 5.7529, "speed/data_load_time": 3.4265, "speed/curr_step_time": 5.7529, "speed/est_time_elapsed": "15.85 days", "speed/est_time_remaining": "1.6 hours", "speed/est_time_elapsed_hrs": 380.33, "speed/est_time_elapsed_days": 15.85, "speed/est_time_remaining_hrs": 1.6, "speed/est_time_remaining_days": 0.07, "optim/grad_norm": 0.048364926129579544, "optim/lr": 3.547225094489237e-06, "optim/total_tokens": 1996497092608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.258825421333313, "created_at": "2025-06-03T10:25:51.534573+00:00"} {"global_step": 238002, "acc_step": 0, "speed/wps": 5610.311678069334, "speed/FLOPS": 247947059992311.6, "speed/curr_iter_time": 2.9167, "speed/data_load_time": 0.0015, "speed/curr_step_time": 2.9167, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 192.83, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04707122594118118, "optim/lr": 3.5436778693946904e-06, "optim/total_tokens": 1996505481216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2629337310791016, "created_at": "2025-06-03T10:25:54.462453+00:00"} {"global_step": 238003, "acc_step": 0, "speed/wps": 5564.856541476668, "speed/FLOPS": 245938175615396.03, "speed/curr_iter_time": 2.9419, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9419, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 194.49, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04697079584002495, "optim/lr": 3.5401306443001436e-06, "optim/total_tokens": 1996513869824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.264727234840393, "created_at": "2025-06-03T10:25:57.414693+00:00"} {"global_step": 238004, "acc_step": 0, "speed/wps": 5568.665723168556, "speed/FLOPS": 246106521949018.1, "speed/curr_iter_time": 2.9409, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9409, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 194.43, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04722373187541962, "optim/lr": 3.5365834192058187e-06, "optim/total_tokens": 1996522258432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2706387042999268, "created_at": "2025-06-03T10:26:00.361672+00:00"} {"global_step": 238005, "acc_step": 0, "speed/wps": 5556.13675959811, "speed/FLOPS": 245552805888253.38, "speed/curr_iter_time": 2.9476, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9476, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 194.87, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0462399385869503, "optim/lr": 3.5330361941112723e-06, "optim/total_tokens": 1996530647040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2673636674880981, "created_at": "2025-06-03T10:26:03.319304+00:00"} {"global_step": 238006, "acc_step": 0, "speed/wps": 5576.3035884961955, "speed/FLOPS": 246444076502361.06, "speed/curr_iter_time": 2.937, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.937, "speed/est_time_elapsed": "8.09 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 194.17, "speed/est_time_elapsed_days": 8.09, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04752301797270775, "optim/lr": 3.5294889690167255e-06, "optim/total_tokens": 1996539035648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2593998908996582, "created_at": "2025-06-03T10:26:06.265030+00:00"} {"global_step": 238007, "acc_step": 0, "speed/wps": 5543.824721018639, "speed/FLOPS": 245008676801767.0, "speed/curr_iter_time": 2.9528, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9528, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.22, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046976760029792786, "optim/lr": 3.5259417439221786e-06, "optim/total_tokens": 1996547424256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 358, "loss/out": 1.2686711549758911, "created_at": "2025-06-03T10:26:09.229558+00:00"} {"global_step": 238008, "acc_step": 0, "speed/wps": 5542.45872105921, "speed/FLOPS": 244948306595381.84, "speed/curr_iter_time": 2.9549, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9549, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.36, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.06051131710410118, "optim/lr": 3.5223945188278537e-06, "optim/total_tokens": 1996555812864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.25760817527771, "created_at": "2025-06-03T10:26:12.193163+00:00"} {"global_step": 238009, "acc_step": 0, "speed/wps": 5546.167447648407, "speed/FLOPS": 245112213327640.8, "speed/curr_iter_time": 2.953, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.953, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.23, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0471101850271225, "optim/lr": 3.5188472937333074e-06, "optim/total_tokens": 1996564201472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2703713178634644, "created_at": "2025-06-03T10:26:15.154216+00:00"} {"global_step": 238010, "acc_step": 0, "speed/wps": 5537.376833399191, "speed/FLOPS": 244723713172268.06, "speed/curr_iter_time": 2.9564, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9564, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04667848348617554, "optim/lr": 3.5153000686387605e-06, "optim/total_tokens": 1996572590080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2745535373687744, "created_at": "2025-06-03T10:26:18.120870+00:00"} {"global_step": 238011, "acc_step": 0, "speed/wps": 5523.324529798358, "speed/FLOPS": 244102673279321.3, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04671628028154373, "optim/lr": 3.5117528435442137e-06, "optim/total_tokens": 1996580978688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2505625486373901, "created_at": "2025-06-03T10:26:21.095999+00:00"} {"global_step": 238012, "acc_step": 0, "speed/wps": 5530.047383274212, "speed/FLOPS": 244399788992270.6, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046976178884506226, "optim/lr": 3.508205618449889e-06, "optim/total_tokens": 1996589367296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2541730403900146, "created_at": "2025-06-03T10:26:24.067249+00:00"} {"global_step": 238013, "acc_step": 0, "speed/wps": 5538.095778569411, "speed/FLOPS": 244755486868896.8, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.45, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04785105958580971, "optim/lr": 3.504658393355342e-06, "optim/total_tokens": 1996597755904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2735450267791748, "created_at": "2025-06-03T10:26:27.033821+00:00"} {"global_step": 238014, "acc_step": 0, "speed/wps": 5554.503745758919, "speed/FLOPS": 245480635035083.7, "speed/curr_iter_time": 2.9486, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9486, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 194.95, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04708443582057953, "optim/lr": 3.5011111682607956e-06, "optim/total_tokens": 1996606144512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2614576816558838, "created_at": "2025-06-03T10:26:29.992302+00:00"} {"global_step": 238015, "acc_step": 0, "speed/wps": 5554.260497310911, "speed/FLOPS": 245469884698740.16, "speed/curr_iter_time": 2.9488, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9488, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 194.96, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.049058232456445694, "optim/lr": 3.497563943166249e-06, "optim/total_tokens": 1996614533120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2643071413040161, "created_at": "2025-06-03T10:26:32.946529+00:00"} {"global_step": 238016, "acc_step": 0, "speed/wps": 5543.3990600015, "speed/FLOPS": 244989864763540.06, "speed/curr_iter_time": 2.9545, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9545, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.34, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05074480548501015, "optim/lr": 3.494016718071924e-06, "optim/total_tokens": 1996622921728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2460176944732666, "created_at": "2025-06-03T10:26:35.907105+00:00"} {"global_step": 238017, "acc_step": 0, "speed/wps": 5529.529600827526, "speed/FLOPS": 244376905658377.9, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046992767602205276, "optim/lr": 3.490469492977377e-06, "optim/total_tokens": 1996631310336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.260751724243164, "created_at": "2025-06-03T10:26:38.874854+00:00"} {"global_step": 238018, "acc_step": 0, "speed/wps": 5537.264132608082, "speed/FLOPS": 244718732374155.97, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.56, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046742018312215805, "optim/lr": 3.4869222678828307e-06, "optim/total_tokens": 1996639698944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2438386678695679, "created_at": "2025-06-03T10:26:41.840522+00:00"} {"global_step": 238019, "acc_step": 0, "speed/wps": 5514.179941595084, "speed/FLOPS": 243698529286982.12, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04641303792595863, "optim/lr": 3.483375042788506e-06, "optim/total_tokens": 1996648087552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2680007219314575, "created_at": "2025-06-03T10:26:44.818497+00:00"} {"global_step": 238020, "acc_step": 0, "speed/wps": 5534.0895159380225, "speed/FLOPS": 244578430566500.5, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 195.59, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04685739427804947, "optim/lr": 3.479827817693959e-06, "optim/total_tokens": 1996656476160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2734599113464355, "created_at": "2025-06-03T10:26:47.786501+00:00"} {"global_step": 238021, "acc_step": 0, "speed/wps": 5515.033647974298, "speed/FLOPS": 243736258739278.03, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04647129401564598, "optim/lr": 3.476280592599412e-06, "optim/total_tokens": 1996664864768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2679202556610107, "created_at": "2025-06-03T10:26:50.765673+00:00"} {"global_step": 238022, "acc_step": 0, "speed/wps": 5532.371255807181, "speed/FLOPS": 244502492263569.9, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.74, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046563901007175446, "optim/lr": 3.4727333675048658e-06, "optim/total_tokens": 1996673253376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2671507596969604, "created_at": "2025-06-03T10:26:53.731937+00:00"} {"global_step": 238023, "acc_step": 0, "speed/wps": 5519.862373124182, "speed/FLOPS": 243949663675247.06, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.81 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.81, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04682100564241409, "optim/lr": 3.469186142410541e-06, "optim/total_tokens": 1996681641984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2764989137649536, "created_at": "2025-06-03T10:26:56.708602+00:00"} {"global_step": 238024, "acc_step": 0, "speed/wps": 5538.376181623788, "speed/FLOPS": 244767879248667.34, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.44, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048371780663728714, "optim/lr": 3.465638917315994e-06, "optim/total_tokens": 1996690030592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.239941120147705, "created_at": "2025-06-03T10:26:59.671841+00:00"} {"global_step": 238025, "acc_step": 0, "speed/wps": 5529.500221372074, "speed/FLOPS": 244375607236824.56, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0474100224673748, "optim/lr": 3.4620916922214472e-06, "optim/total_tokens": 1996698419200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.258704662322998, "created_at": "2025-06-03T10:27:02.643761+00:00"} {"global_step": 238026, "acc_step": 0, "speed/wps": 5524.755433848391, "speed/FLOPS": 244165911914301.9, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0467829667031765, "optim/lr": 3.458544467126901e-06, "optim/total_tokens": 1996706807808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2667866945266724, "created_at": "2025-06-03T10:27:05.613917+00:00"} {"global_step": 238027, "acc_step": 0, "speed/wps": 5531.810373152651, "speed/FLOPS": 244477704121097.34, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046797554939985275, "optim/lr": 3.454997242032576e-06, "optim/total_tokens": 1996715196416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.274721384048462, "created_at": "2025-06-03T10:27:08.581508+00:00"} {"global_step": 238028, "acc_step": 0, "speed/wps": 5529.130348326608, "speed/FLOPS": 244359260741396.88, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05071016401052475, "optim/lr": 3.451450016938029e-06, "optim/total_tokens": 1996723585024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2874878644943237, "created_at": "2025-06-03T10:27:11.553877+00:00"} {"global_step": 238029, "acc_step": 0, "speed/wps": 5530.268159403756, "speed/FLOPS": 244409546167161.75, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0482214018702507, "optim/lr": 3.4479027918434823e-06, "optim/total_tokens": 1996731973632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.256010890007019, "created_at": "2025-06-03T10:27:14.524513+00:00"} {"global_step": 238030, "acc_step": 0, "speed/wps": 5531.289517478702, "speed/FLOPS": 244454684966289.8, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04784902557730675, "optim/lr": 3.4443555667489355e-06, "optim/total_tokens": 1996740362240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2659196853637695, "created_at": "2025-06-03T10:27:17.493889+00:00"} {"global_step": 238031, "acc_step": 0, "speed/wps": 5515.411979030478, "speed/FLOPS": 243752979035487.28, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04781825840473175, "optim/lr": 3.440808341654611e-06, "optim/total_tokens": 1996748750848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2636264562606812, "created_at": "2025-06-03T10:27:20.471138+00:00"} {"global_step": 238032, "acc_step": 0, "speed/wps": 5534.2555583345475, "speed/FLOPS": 244585768790544.88, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047290146350860596, "optim/lr": 3.437261116560064e-06, "optim/total_tokens": 1996757139456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2542598247528076, "created_at": "2025-06-03T10:27:23.439975+00:00"} {"global_step": 238033, "acc_step": 0, "speed/wps": 5528.29962236711, "speed/FLOPS": 244322546906027.97, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046699874103069305, "optim/lr": 3.4337138914655174e-06, "optim/total_tokens": 1996765528064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.267698049545288, "created_at": "2025-06-03T10:27:26.412445+00:00"} {"global_step": 238034, "acc_step": 0, "speed/wps": 5524.865764701037, "speed/FLOPS": 244170787973264.38, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.8 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.8, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04621686786413193, "optim/lr": 3.4301666663709706e-06, "optim/total_tokens": 1996773916672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2750544548034668, "created_at": "2025-06-03T10:27:29.387303+00:00"} {"global_step": 238035, "acc_step": 0, "speed/wps": 5529.534523793914, "speed/FLOPS": 244377123228294.2, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046918537467718124, "optim/lr": 3.426619441276646e-06, "optim/total_tokens": 1996782305280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2530796527862549, "created_at": "2025-06-03T10:27:32.358294+00:00"} {"global_step": 238036, "acc_step": 0, "speed/wps": 5527.559163157332, "speed/FLOPS": 244289822398969.56, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04771003499627113, "optim/lr": 3.4230722161820993e-06, "optim/total_tokens": 1996790693888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2466557025909424, "created_at": "2025-06-03T10:27:35.326342+00:00"} {"global_step": 238037, "acc_step": 0, "speed/wps": 5533.450763940398, "speed/FLOPS": 244550200997634.6, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04721847176551819, "optim/lr": 3.4195249910875525e-06, "optim/total_tokens": 1996799082496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2574814558029175, "created_at": "2025-06-03T10:27:38.295057+00:00"} {"global_step": 238038, "acc_step": 0, "speed/wps": 5505.3580686865425, "speed/FLOPS": 243308647658863.5, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 196.71, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04751667380332947, "optim/lr": 3.4159777659930056e-06, "optim/total_tokens": 1996807471104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.269299030303955, "created_at": "2025-06-03T10:27:41.276743+00:00"} {"global_step": 238039, "acc_step": 0, "speed/wps": 5504.985181466112, "speed/FLOPS": 243292167952330.3, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 196.73, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04657502472400665, "optim/lr": 3.412430540898681e-06, "optim/total_tokens": 1996815859712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2459524869918823, "created_at": "2025-06-03T10:27:44.261494+00:00"} {"global_step": 238040, "acc_step": 0, "speed/wps": 5514.555893186441, "speed/FLOPS": 243715144423025.4, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04715627804398537, "optim/lr": 3.4088833158041344e-06, "optim/total_tokens": 1996824248320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2698580026626587, "created_at": "2025-06-03T10:27:47.236885+00:00"} {"global_step": 238041, "acc_step": 0, "speed/wps": 5527.610710658885, "speed/FLOPS": 244292100534694.22, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0492384135723114, "optim/lr": 3.4053360907095875e-06, "optim/total_tokens": 1996832636928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2534427642822266, "created_at": "2025-06-03T10:27:50.205560+00:00"} {"global_step": 238042, "acc_step": 0, "speed/wps": 5526.773371905288, "speed/FLOPS": 244255094447673.47, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04716124013066292, "optim/lr": 3.4017888656150407e-06, "optim/total_tokens": 1996841025536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.248394250869751, "created_at": "2025-06-03T10:27:53.179808+00:00"} {"global_step": 238043, "acc_step": 0, "speed/wps": 5530.582335269368, "speed/FLOPS": 244423431132323.94, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04725337401032448, "optim/lr": 3.3982416405207162e-06, "optim/total_tokens": 1996849414144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2608749866485596, "created_at": "2025-06-03T10:27:56.151242+00:00"} {"global_step": 238044, "acc_step": 0, "speed/wps": 5522.072236627225, "speed/FLOPS": 244047328330974.75, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04692515358328819, "optim/lr": 3.3946944154261694e-06, "optim/total_tokens": 1996857802752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2660022974014282, "created_at": "2025-06-03T10:27:59.127144+00:00"} {"global_step": 238045, "acc_step": 0, "speed/wps": 5521.852752637941, "speed/FLOPS": 244037628262069.3, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04718240723013878, "optim/lr": 3.3911471903316226e-06, "optim/total_tokens": 1996866191360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2746303081512451, "created_at": "2025-06-03T10:28:02.102570+00:00"} {"global_step": 238046, "acc_step": 0, "speed/wps": 5507.042616782253, "speed/FLOPS": 243383096062395.12, "speed/curr_iter_time": 2.9741, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9741, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04938759282231331, "optim/lr": 3.387599965237298e-06, "optim/total_tokens": 1996874579968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2586588859558105, "created_at": "2025-06-03T10:28:05.087062+00:00"} {"global_step": 238047, "acc_step": 0, "speed/wps": 5503.4591098316305, "speed/FLOPS": 243224723397228.94, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.79 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.79, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04815850034356117, "optim/lr": 3.3840527401427513e-06, "optim/total_tokens": 1996882968576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2695941925048828, "created_at": "2025-06-03T10:28:08.068548+00:00"} {"global_step": 238048, "acc_step": 0, "speed/wps": 5527.854748706832, "speed/FLOPS": 244302885767313.47, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04721270874142647, "optim/lr": 3.3805055150482045e-06, "optim/total_tokens": 1996891357184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.275383472442627, "created_at": "2025-06-03T10:28:11.040784+00:00"} {"global_step": 238049, "acc_step": 0, "speed/wps": 5522.043014795861, "speed/FLOPS": 244046036875599.38, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047504909336566925, "optim/lr": 3.3769582899536577e-06, "optim/total_tokens": 1996899745792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2688872814178467, "created_at": "2025-06-03T10:28:14.013801+00:00"} {"global_step": 238050, "acc_step": 0, "speed/wps": 5520.592456811797, "speed/FLOPS": 243981929637332.56, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04778151214122772, "optim/lr": 3.3734110648593332e-06, "optim/total_tokens": 1996908134400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2587497234344482, "created_at": "2025-06-03T10:28:16.986012+00:00"} {"global_step": 238051, "acc_step": 0, "speed/wps": 5522.887981809443, "speed/FLOPS": 244083380092666.44, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04624123498797417, "optim/lr": 3.3698638397647864e-06, "optim/total_tokens": 1996916523008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2549948692321777, "created_at": "2025-06-03T10:28:19.960774+00:00"} {"global_step": 238052, "acc_step": 0, "speed/wps": 5531.372788888966, "speed/FLOPS": 244458365136401.8, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04794562608003616, "optim/lr": 3.3663166146702396e-06, "optim/total_tokens": 1996924911616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2478784322738647, "created_at": "2025-06-03T10:28:22.927431+00:00"} {"global_step": 238053, "acc_step": 0, "speed/wps": 5519.203201667714, "speed/FLOPS": 243920531670816.53, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04733111709356308, "optim/lr": 3.3627693895756928e-06, "optim/total_tokens": 1996933300224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2631597518920898, "created_at": "2025-06-03T10:28:25.900538+00:00"} {"global_step": 238054, "acc_step": 0, "speed/wps": 5527.041945510255, "speed/FLOPS": 244266964026328.7, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046774595975875854, "optim/lr": 3.3592221644813683e-06, "optim/total_tokens": 1996941688832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.263363242149353, "created_at": "2025-06-03T10:28:28.869591+00:00"} {"global_step": 238055, "acc_step": 0, "speed/wps": 5514.740438498702, "speed/FLOPS": 243723300381238.84, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.39, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0471949502825737, "optim/lr": 3.3556749393868215e-06, "optim/total_tokens": 1996950077440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2826777696609497, "created_at": "2025-06-03T10:28:31.845156+00:00"} {"global_step": 238056, "acc_step": 0, "speed/wps": 5518.351235462924, "speed/FLOPS": 243882879125323.16, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04702937602996826, "optim/lr": 3.3521277142922747e-06, "optim/total_tokens": 1996958466048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.258551001548767, "created_at": "2025-06-03T10:28:34.818919+00:00"} {"global_step": 238057, "acc_step": 0, "speed/wps": 5515.954896491228, "speed/FLOPS": 243776973208348.97, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04746974632143974, "optim/lr": 3.348580489197728e-06, "optim/total_tokens": 1996966854656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2523186206817627, "created_at": "2025-06-03T10:28:37.794267+00:00"} {"global_step": 238058, "acc_step": 0, "speed/wps": 5514.980404468723, "speed/FLOPS": 243733905648856.56, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047168366611003876, "optim/lr": 3.345033264103403e-06, "optim/total_tokens": 1996975243264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2623651027679443, "created_at": "2025-06-03T10:28:40.775504+00:00"} {"global_step": 238059, "acc_step": 0, "speed/wps": 5520.561386583158, "speed/FLOPS": 243980556492258.6, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.78 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.78, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04663805291056633, "optim/lr": 3.3414860390088565e-06, "optim/total_tokens": 1996983631872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2649941444396973, "created_at": "2025-06-03T10:28:43.752392+00:00"} {"global_step": 238060, "acc_step": 0, "speed/wps": 5520.346211709685, "speed/FLOPS": 243971046864215.9, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04947597533464432, "optim/lr": 3.3379388139143097e-06, "optim/total_tokens": 1996992020480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2503328323364258, "created_at": "2025-06-03T10:28:46.728580+00:00"} {"global_step": 238061, "acc_step": 0, "speed/wps": 5517.232349784552, "speed/FLOPS": 243833430105315.2, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046813204884529114, "optim/lr": 3.334391588819763e-06, "optim/total_tokens": 1997000409088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2454500198364258, "created_at": "2025-06-03T10:28:49.706958+00:00"} {"global_step": 238062, "acc_step": 0, "speed/wps": 5511.1413128174, "speed/FLOPS": 243564237448120.5, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04662477225065231, "optim/lr": 3.330844363725438e-06, "optim/total_tokens": 1997008797696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2553304433822632, "created_at": "2025-06-03T10:28:52.684277+00:00"} {"global_step": 238063, "acc_step": 0, "speed/wps": 5517.174105294906, "speed/FLOPS": 243830855996995.2, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05033247917890549, "optim/lr": 3.3272971386308916e-06, "optim/total_tokens": 1997017186304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2757620811462402, "created_at": "2025-06-03T10:28:55.663016+00:00"} {"global_step": 238064, "acc_step": 0, "speed/wps": 5518.068968935097, "speed/FLOPS": 243870404389564.25, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04696772247552872, "optim/lr": 3.323749913536345e-06, "optim/total_tokens": 1997025574912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2589622735977173, "created_at": "2025-06-03T10:28:58.638070+00:00"} {"global_step": 238065, "acc_step": 0, "speed/wps": 5521.263428916316, "speed/FLOPS": 244011583170005.75, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04911221191287041, "optim/lr": 3.320202688441798e-06, "optim/total_tokens": 1997033963520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2507165670394897, "created_at": "2025-06-03T10:29:01.615002+00:00"} {"global_step": 238066, "acc_step": 0, "speed/wps": 5519.197269412178, "speed/FLOPS": 243920269495485.88, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047881241887807846, "optim/lr": 3.316655463347473e-06, "optim/total_tokens": 1997042352128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.259789228439331, "created_at": "2025-06-03T10:29:04.592029+00:00"} {"global_step": 238067, "acc_step": 0, "speed/wps": 5514.32854144468, "speed/FLOPS": 243705096639731.3, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04829651489853859, "optim/lr": 3.3131082382529267e-06, "optim/total_tokens": 1997050740736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2654061317443848, "created_at": "2025-06-03T10:29:07.568214+00:00"} {"global_step": 238068, "acc_step": 0, "speed/wps": 5527.266343065873, "speed/FLOPS": 244276881249716.2, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05007133260369301, "optim/lr": 3.30956101315838e-06, "optim/total_tokens": 1997059129344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.256630301475525, "created_at": "2025-06-03T10:29:10.536788+00:00"} {"global_step": 238069, "acc_step": 0, "speed/wps": 5528.4629694667055, "speed/FLOPS": 244329766011743.84, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04662400484085083, "optim/lr": 3.306013788063833e-06, "optim/total_tokens": 1997067517952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.249025821685791, "created_at": "2025-06-03T10:29:13.504867+00:00"} {"global_step": 238070, "acc_step": 0, "speed/wps": 5522.003116131307, "speed/FLOPS": 244044273558845.97, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04756566509604454, "optim/lr": 3.302466562969508e-06, "optim/total_tokens": 1997075906560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2643942832946777, "created_at": "2025-06-03T10:29:16.477194+00:00"} {"global_step": 238071, "acc_step": 0, "speed/wps": 5513.614319201154, "speed/FLOPS": 243673531672288.28, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04758460447192192, "optim/lr": 3.2989193378749618e-06, "optim/total_tokens": 1997084295168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2566062211990356, "created_at": "2025-06-03T10:29:19.455987+00:00"} {"global_step": 238072, "acc_step": 0, "speed/wps": 5517.744250999265, "speed/FLOPS": 243856053518857.56, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.77 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.77, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047884512692689896, "optim/lr": 3.295372112780415e-06, "optim/total_tokens": 1997092683776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.263624906539917, "created_at": "2025-06-03T10:29:22.432184+00:00"} {"global_step": 238073, "acc_step": 0, "speed/wps": 5531.9544408251295, "speed/FLOPS": 244484071174815.72, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04760724678635597, "optim/lr": 3.29182488768609e-06, "optim/total_tokens": 1997101072384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2587823867797852, "created_at": "2025-06-03T10:29:25.399125+00:00"} {"global_step": 238074, "acc_step": 0, "speed/wps": 5532.001757040395, "speed/FLOPS": 244486162309344.12, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0471494123339653, "optim/lr": 3.2882776625915432e-06, "optim/total_tokens": 1997109460992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2461004257202148, "created_at": "2025-06-03T10:29:28.367239+00:00"} {"global_step": 238075, "acc_step": 0, "speed/wps": 5527.569519213681, "speed/FLOPS": 244290280083653.1, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048580627888441086, "optim/lr": 3.2847304374969964e-06, "optim/total_tokens": 1997117849600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2588952779769897, "created_at": "2025-06-03T10:29:31.339170+00:00"} {"global_step": 238076, "acc_step": 0, "speed/wps": 5526.122421317565, "speed/FLOPS": 244226325763563.25, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04815656319260597, "optim/lr": 3.28118321240245e-06, "optim/total_tokens": 1997126238208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2689169645309448, "created_at": "2025-06-03T10:29:34.309182+00:00"} {"global_step": 238077, "acc_step": 0, "speed/wps": 5522.267835210507, "speed/FLOPS": 244055972787191.5, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05123043805360794, "optim/lr": 3.277635987308125e-06, "optim/total_tokens": 1997134626816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.2566090822219849, "created_at": "2025-06-03T10:29:37.285192+00:00"} {"global_step": 238078, "acc_step": 0, "speed/wps": 5520.661573614088, "speed/FLOPS": 243984984246221.97, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0469110831618309, "optim/lr": 3.2740887622135783e-06, "optim/total_tokens": 1997143015424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2674955129623413, "created_at": "2025-06-03T10:29:40.259321+00:00"} {"global_step": 238079, "acc_step": 0, "speed/wps": 5516.130067529403, "speed/FLOPS": 243784714871629.66, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04875180125236511, "optim/lr": 3.2705415371190315e-06, "optim/total_tokens": 1997151404032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.252064824104309, "created_at": "2025-06-03T10:29:43.238244+00:00"} {"global_step": 238080, "acc_step": 0, "speed/wps": 5513.077223850704, "speed/FLOPS": 243649794806901.62, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04898133873939514, "optim/lr": 3.266994312024485e-06, "optim/total_tokens": 1997159792640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.253310203552246, "created_at": "2025-06-03T10:29:46.214533+00:00"} {"global_step": 238081, "acc_step": 0, "speed/wps": 5520.348252311521, "speed/FLOPS": 243971137048372.3, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.045977745205163956, "optim/lr": 3.2634470869301602e-06, "optim/total_tokens": 1997168181248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.271704077720642, "created_at": "2025-06-03T10:29:49.186690+00:00"} {"global_step": 238082, "acc_step": 0, "speed/wps": 5518.209229019285, "speed/FLOPS": 243876603167369.2, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0463656447827816, "optim/lr": 3.2598998618356134e-06, "optim/total_tokens": 1997176569856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2643282413482666, "created_at": "2025-06-03T10:29:52.162475+00:00"} {"global_step": 238083, "acc_step": 0, "speed/wps": 5519.373527427315, "speed/FLOPS": 243928059197584.62, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.76 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.76, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04715162515640259, "optim/lr": 3.2563526367410666e-06, "optim/total_tokens": 1997184958464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.272788166999817, "created_at": "2025-06-03T10:29:55.135752+00:00"} {"global_step": 238084, "acc_step": 0, "speed/wps": 5528.316550222551, "speed/FLOPS": 244323295030593.84, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047691602259874344, "optim/lr": 3.25280541164652e-06, "optim/total_tokens": 1997193347072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2701833248138428, "created_at": "2025-06-03T10:29:58.104080+00:00"} {"global_step": 238085, "acc_step": 0, "speed/wps": 5514.957281485062, "speed/FLOPS": 243732883731332.9, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04745880886912346, "optim/lr": 3.2492581865521953e-06, "optim/total_tokens": 1997201735680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2589459419250488, "created_at": "2025-06-03T10:30:01.083039+00:00"} {"global_step": 238086, "acc_step": 0, "speed/wps": 5525.596341290518, "speed/FLOPS": 244203075719089.44, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04830912500619888, "optim/lr": 3.2457109614576485e-06, "optim/total_tokens": 1997210124288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2543220520019531, "created_at": "2025-06-03T10:30:04.053133+00:00"} {"global_step": 238087, "acc_step": 0, "speed/wps": 5507.847267032736, "speed/FLOPS": 243418657484893.16, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04646753892302513, "optim/lr": 3.2421637363631017e-06, "optim/total_tokens": 1997218512896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2659066915512085, "created_at": "2025-06-03T10:30:07.034418+00:00"} {"global_step": 238088, "acc_step": 0, "speed/wps": 5519.935394626397, "speed/FLOPS": 243952890851887.03, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046636950224637985, "optim/lr": 3.2386165112685553e-06, "optim/total_tokens": 1997226901504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.250610589981079, "created_at": "2025-06-03T10:30:10.010125+00:00"} {"global_step": 238089, "acc_step": 0, "speed/wps": 5522.470561871863, "speed/FLOPS": 244064932267974.3, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046606965363025665, "optim/lr": 3.2350692861742304e-06, "optim/total_tokens": 1997235290112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2551435232162476, "created_at": "2025-06-03T10:30:12.981466+00:00"} {"global_step": 238090, "acc_step": 0, "speed/wps": 5521.4395420876945, "speed/FLOPS": 244019366470751.75, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04658651351928711, "optim/lr": 3.2315220610796835e-06, "optim/total_tokens": 1997243678720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2701764106750488, "created_at": "2025-06-03T10:30:15.954564+00:00"} {"global_step": 238091, "acc_step": 0, "speed/wps": 5520.787309970836, "speed/FLOPS": 243990541149613.2, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04638170078396797, "optim/lr": 3.2279748359851367e-06, "optim/total_tokens": 1997252067328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.243316411972046, "created_at": "2025-06-03T10:30:18.926766+00:00"} {"global_step": 238092, "acc_step": 0, "speed/wps": 5523.856709284607, "speed/FLOPS": 244126192888672.0, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046697862446308136, "optim/lr": 3.22442761089059e-06, "optim/total_tokens": 1997260455936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.258248209953308, "created_at": "2025-06-03T10:30:21.902842+00:00"} {"global_step": 238093, "acc_step": 0, "speed/wps": 5520.96282186235, "speed/FLOPS": 243998297876866.84, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04669373482465744, "optim/lr": 3.2208803857962654e-06, "optim/total_tokens": 1997268844544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.243850588798523, "created_at": "2025-06-03T10:30:24.875387+00:00"} {"global_step": 238094, "acc_step": 0, "speed/wps": 5526.169248540442, "speed/FLOPS": 244228395287130.97, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 195.92, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04742734879255295, "optim/lr": 3.2173331607017186e-06, "optim/total_tokens": 1997277233152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2576961517333984, "created_at": "2025-06-03T10:30:27.848754+00:00"} {"global_step": 238095, "acc_step": 0, "speed/wps": 5515.936229583949, "speed/FLOPS": 243776148226593.12, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04681877791881561, "optim/lr": 3.213785935607172e-06, "optim/total_tokens": 1997285621760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2740395069122314, "created_at": "2025-06-03T10:30:30.827671+00:00"} {"global_step": 238096, "acc_step": 0, "speed/wps": 5504.91484299553, "speed/FLOPS": 243289059351955.5, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.75 hours", "speed/est_time_elapsed_hrs": 196.77, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.75, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04694541543722153, "optim/lr": 3.210238710512625e-06, "optim/total_tokens": 1997294010368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2428700923919678, "created_at": "2025-06-03T10:30:33.812937+00:00"} {"global_step": 238097, "acc_step": 0, "speed/wps": 5521.725246752761, "speed/FLOPS": 244031993154578.66, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0468645840883255, "optim/lr": 3.2066914854183005e-06, "optim/total_tokens": 1997302398976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2491470575332642, "created_at": "2025-06-03T10:30:36.784612+00:00"} {"global_step": 238098, "acc_step": 0, "speed/wps": 5521.66999616119, "speed/FLOPS": 244029551361229.38, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04719405248761177, "optim/lr": 3.2031442603237537e-06, "optim/total_tokens": 1997310787584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2548761367797852, "created_at": "2025-06-03T10:30:39.758079+00:00"} {"global_step": 238099, "acc_step": 0, "speed/wps": 5526.292997342293, "speed/FLOPS": 244233864350769.03, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04647698253393173, "optim/lr": 3.199597035229207e-06, "optim/total_tokens": 1997319176192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2596997022628784, "created_at": "2025-06-03T10:30:42.727592+00:00"} {"global_step": 238100, "acc_step": 0, "speed/wps": 5517.191214245559, "speed/FLOPS": 243831612125042.5, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.34, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047439757734537125, "optim/lr": 3.1960498101348824e-06, "optim/total_tokens": 1997327564800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.257398009300232, "created_at": "2025-06-03T10:30:45.701674+00:00"} {"global_step": 238101, "acc_step": 0, "speed/wps": 5515.492444675154, "speed/FLOPS": 243756535205121.47, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04760614037513733, "optim/lr": 3.1925025850403356e-06, "optim/total_tokens": 1997335953408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2495472431182861, "created_at": "2025-06-03T10:30:48.677232+00:00"} {"global_step": 238102, "acc_step": 0, "speed/wps": 5512.579522292263, "speed/FLOPS": 243627798945486.06, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0462254174053669, "optim/lr": 3.1889553599457888e-06, "optim/total_tokens": 1997344342016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.26084303855896, "created_at": "2025-06-03T10:30:51.658497+00:00"} {"global_step": 238103, "acc_step": 0, "speed/wps": 5520.093239437265, "speed/FLOPS": 243959866784604.4, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0477675199508667, "optim/lr": 3.185408134851242e-06, "optim/total_tokens": 1997352730624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2561544179916382, "created_at": "2025-06-03T10:30:54.631023+00:00"} {"global_step": 238104, "acc_step": 0, "speed/wps": 5507.484102356894, "speed/FLOPS": 243402607465066.25, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04661058634519577, "optim/lr": 3.1818609097569175e-06, "optim/total_tokens": 1997361119232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2515939474105835, "created_at": "2025-06-03T10:30:57.614111+00:00"} {"global_step": 238105, "acc_step": 0, "speed/wps": 5502.9934906925, "speed/FLOPS": 243204145414534.16, "speed/curr_iter_time": 2.9763, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9763, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.85, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048981163650751114, "optim/lr": 3.1783136846623707e-06, "optim/total_tokens": 1997369507840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2542757987976074, "created_at": "2025-06-03T10:31:00.598969+00:00"} {"global_step": 238106, "acc_step": 0, "speed/wps": 5514.305988272378, "speed/FLOPS": 243704099904953.16, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04754004627466202, "optim/lr": 3.174766459567824e-06, "optim/total_tokens": 1997377896448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2718809843063354, "created_at": "2025-06-03T10:31:03.578275+00:00"} {"global_step": 238107, "acc_step": 0, "speed/wps": 5521.3271204224375, "speed/FLOPS": 244014398008573.62, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.74 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.74, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04679741710424423, "optim/lr": 3.171219234473277e-06, "optim/total_tokens": 1997386285056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2652086019515991, "created_at": "2025-06-03T10:31:06.556239+00:00"} {"global_step": 238108, "acc_step": 0, "speed/wps": 5523.327097610552, "speed/FLOPS": 244102786763477.06, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04713946208357811, "optim/lr": 3.1676720093789526e-06, "optim/total_tokens": 1997394673664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.268678069114685, "created_at": "2025-06-03T10:31:09.532555+00:00"} {"global_step": 238109, "acc_step": 0, "speed/wps": 5517.065998490241, "speed/FLOPS": 243826078229569.78, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04750495404005051, "optim/lr": 3.1641247842844057e-06, "optim/total_tokens": 1997403062272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2367380857467651, "created_at": "2025-06-03T10:31:12.508673+00:00"} {"global_step": 238110, "acc_step": 0, "speed/wps": 5513.195292216623, "speed/FLOPS": 243655012824346.56, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046473946422338486, "optim/lr": 3.160577559189859e-06, "optim/total_tokens": 1997411450880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.269292950630188, "created_at": "2025-06-03T10:31:15.485585+00:00"} {"global_step": 238111, "acc_step": 0, "speed/wps": 5510.88125530519, "speed/FLOPS": 243552744237175.84, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04697960987687111, "optim/lr": 3.157030334095312e-06, "optim/total_tokens": 1997419839488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2528843879699707, "created_at": "2025-06-03T10:31:18.468233+00:00"} {"global_step": 238112, "acc_step": 0, "speed/wps": 5502.838531612611, "speed/FLOPS": 243197297016355.56, "speed/curr_iter_time": 2.9764, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9764, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048680104315280914, "optim/lr": 3.1534831090009876e-06, "optim/total_tokens": 1997428228096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2739287614822388, "created_at": "2025-06-03T10:31:21.450003+00:00"} {"global_step": 238113, "acc_step": 0, "speed/wps": 5512.858070789571, "speed/FLOPS": 243640109363326.6, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.049002233892679214, "optim/lr": 3.149935883906441e-06, "optim/total_tokens": 1997436616704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2734416723251343, "created_at": "2025-06-03T10:31:24.427670+00:00"} {"global_step": 238114, "acc_step": 0, "speed/wps": 5505.879183122536, "speed/FLOPS": 243331678249628.94, "speed/curr_iter_time": 2.9734, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9734, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.09794088453054428, "optim/lr": 3.146388658811894e-06, "optim/total_tokens": 1997445005312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2623777389526367, "created_at": "2025-06-03T10:31:27.411622+00:00"} {"global_step": 238115, "acc_step": 0, "speed/wps": 5519.657776163502, "speed/FLOPS": 243940621536807.16, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.051366664469242096, "optim/lr": 3.142841433717347e-06, "optim/total_tokens": 1997453393920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2611725330352783, "created_at": "2025-06-03T10:31:30.384980+00:00"} {"global_step": 238116, "acc_step": 0, "speed/wps": 5523.600466862258, "speed/FLOPS": 244114868285171.78, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046813108026981354, "optim/lr": 3.1392942086230227e-06, "optim/total_tokens": 1997461782528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2696408033370972, "created_at": "2025-06-03T10:31:33.357159+00:00"} {"global_step": 238117, "acc_step": 0, "speed/wps": 5513.123130518712, "speed/FLOPS": 243651823646655.94, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048317570239305496, "optim/lr": 3.135746983528476e-06, "optim/total_tokens": 1997470171136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2651829719543457, "created_at": "2025-06-03T10:31:36.333672+00:00"} {"global_step": 238118, "acc_step": 0, "speed/wps": 5524.553605065221, "speed/FLOPS": 244156992115139.16, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04748294875025749, "optim/lr": 3.132199758433929e-06, "optim/total_tokens": 1997478559744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2670904397964478, "created_at": "2025-06-03T10:31:39.307737+00:00"} {"global_step": 238119, "acc_step": 0, "speed/wps": 5515.853411056095, "speed/FLOPS": 243772488071565.62, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0468708761036396, "optim/lr": 3.1286525333393823e-06, "optim/total_tokens": 1997486948352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2547122240066528, "created_at": "2025-06-03T10:31:42.282921+00:00"} {"global_step": 238120, "acc_step": 0, "speed/wps": 5521.528330530274, "speed/FLOPS": 244023290465453.3, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.73 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.73, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046444181352853775, "optim/lr": 3.1251053082450574e-06, "optim/total_tokens": 1997495336960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.253845453262329, "created_at": "2025-06-03T10:31:45.255885+00:00"} {"global_step": 238121, "acc_step": 0, "speed/wps": 5518.92685971548, "speed/FLOPS": 243908318770974.12, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04730277135968208, "optim/lr": 3.121558083150511e-06, "optim/total_tokens": 1997503725568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2441169023513794, "created_at": "2025-06-03T10:31:48.229278+00:00"} {"global_step": 238122, "acc_step": 0, "speed/wps": 5511.042349344638, "speed/FLOPS": 243559863769165.4, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04711524024605751, "optim/lr": 3.118010858055964e-06, "optim/total_tokens": 1997512114176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2601206302642822, "created_at": "2025-06-03T10:31:51.207094+00:00"} {"global_step": 238123, "acc_step": 0, "speed/wps": 5519.748375579914, "speed/FLOPS": 243944625567282.72, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04723859205842018, "optim/lr": 3.1144636329614173e-06, "optim/total_tokens": 1997520502784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.263956904411316, "created_at": "2025-06-03T10:31:54.179629+00:00"} {"global_step": 238124, "acc_step": 0, "speed/wps": 5523.633074532389, "speed/FLOPS": 244116309377290.4, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047152020037174225, "optim/lr": 3.1109164078670924e-06, "optim/total_tokens": 1997528891392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2549593448638916, "created_at": "2025-06-03T10:31:57.152767+00:00"} {"global_step": 238125, "acc_step": 0, "speed/wps": 5522.767954002801, "speed/FLOPS": 244078075477970.9, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046511102467775345, "optim/lr": 3.107369182772546e-06, "optim/total_tokens": 1997537280000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2521889209747314, "created_at": "2025-06-03T10:32:00.124235+00:00"} {"global_step": 238126, "acc_step": 0, "speed/wps": 5507.883604758546, "speed/FLOPS": 243420263426380.6, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.7, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04851975664496422, "optim/lr": 3.1038219576779992e-06, "optim/total_tokens": 1997545668608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2742570638656616, "created_at": "2025-06-03T10:32:03.106607+00:00"} {"global_step": 238127, "acc_step": 0, "speed/wps": 5527.595806168681, "speed/FLOPS": 244291441832515.25, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04804540425539017, "optim/lr": 3.1002747325836743e-06, "optim/total_tokens": 1997554057216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2647110223770142, "created_at": "2025-06-03T10:32:06.076136+00:00"} {"global_step": 238128, "acc_step": 0, "speed/wps": 5525.418292919868, "speed/FLOPS": 244195206892440.9, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04659351333975792, "optim/lr": 3.0967275074891275e-06, "optim/total_tokens": 1997562445824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2541481256484985, "created_at": "2025-06-03T10:32:09.048622+00:00"} {"global_step": 238129, "acc_step": 0, "speed/wps": 5513.575976493796, "speed/FLOPS": 243671837120878.8, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046278588473796844, "optim/lr": 3.093180282394581e-06, "optim/total_tokens": 1997570834432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2697991132736206, "created_at": "2025-06-03T10:32:12.029094+00:00"} {"global_step": 238130, "acc_step": 0, "speed/wps": 5511.252537505622, "speed/FLOPS": 243569153010040.38, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04630715399980545, "optim/lr": 3.0896330573000343e-06, "optim/total_tokens": 1997579223040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2583472728729248, "created_at": "2025-06-03T10:32:15.010368+00:00"} {"global_step": 238131, "acc_step": 0, "speed/wps": 5518.725009029501, "speed/FLOPS": 243899398003819.34, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.72 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.72, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046879157423973083, "optim/lr": 3.0860858322057094e-06, "optim/total_tokens": 1997587611648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2645061016082764, "created_at": "2025-06-03T10:32:17.983335+00:00"} {"global_step": 238132, "acc_step": 0, "speed/wps": 5526.784574503055, "speed/FLOPS": 244255589545154.7, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04811388999223709, "optim/lr": 3.0825386071111626e-06, "optim/total_tokens": 1997596000256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.264273762702942, "created_at": "2025-06-03T10:32:20.952965+00:00"} {"global_step": 238133, "acc_step": 0, "speed/wps": 5518.458710598859, "speed/FLOPS": 243887628976223.9, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04893997684121132, "optim/lr": 3.078991382016616e-06, "optim/total_tokens": 1997604388864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2690906524658203, "created_at": "2025-06-03T10:32:23.926223+00:00"} {"global_step": 238134, "acc_step": 0, "speed/wps": 5513.512203628528, "speed/FLOPS": 243669018686653.12, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04639231413602829, "optim/lr": 3.0754441569220694e-06, "optim/total_tokens": 1997612777472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2530498504638672, "created_at": "2025-06-03T10:32:26.904967+00:00"} {"global_step": 238135, "acc_step": 0, "speed/wps": 5518.144823174277, "speed/FLOPS": 243873756758678.84, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04759823530912399, "optim/lr": 3.0718969318277445e-06, "optim/total_tokens": 1997621166080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2547162771224976, "created_at": "2025-06-03T10:32:29.878528+00:00"} {"global_step": 238136, "acc_step": 0, "speed/wps": 5511.823221383918, "speed/FLOPS": 243594374316436.16, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04712697118520737, "optim/lr": 3.0683497067331977e-06, "optim/total_tokens": 1997629554688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.262070655822754, "created_at": "2025-06-03T10:32:32.856878+00:00"} {"global_step": 238137, "acc_step": 0, "speed/wps": 5505.837248715008, "speed/FLOPS": 243329824963455.97, "speed/curr_iter_time": 2.9748, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9748, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04646265506744385, "optim/lr": 3.064802481638651e-06, "optim/total_tokens": 1997637943296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2619898319244385, "created_at": "2025-06-03T10:32:35.840962+00:00"} {"global_step": 238138, "acc_step": 0, "speed/wps": 5522.804611972743, "speed/FLOPS": 244079695572609.84, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04745408147573471, "optim/lr": 3.0612552565441045e-06, "optim/total_tokens": 1997646331904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2663224935531616, "created_at": "2025-06-03T10:32:38.816678+00:00"} {"global_step": 238139, "acc_step": 0, "speed/wps": 5509.989186310656, "speed/FLOPS": 243513319353640.47, "speed/curr_iter_time": 2.9725, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9725, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04701698198914528, "optim/lr": 3.0577080314497796e-06, "optim/total_tokens": 1997654720512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2569880485534668, "created_at": "2025-06-03T10:32:41.798786+00:00"} {"global_step": 238140, "acc_step": 0, "speed/wps": 5520.753110791816, "speed/FLOPS": 243989029720947.78, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04698445647954941, "optim/lr": 3.0541608063552327e-06, "optim/total_tokens": 1997663109120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2475438117980957, "created_at": "2025-06-03T10:32:44.771345+00:00"} {"global_step": 238141, "acc_step": 0, "speed/wps": 5503.427080369464, "speed/FLOPS": 243223307858942.84, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.77, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04786999896168709, "optim/lr": 3.050613581260686e-06, "optim/total_tokens": 1997671497728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.262420415878296, "created_at": "2025-06-03T10:32:47.752824+00:00"} {"global_step": 238142, "acc_step": 0, "speed/wps": 5531.494439803704, "speed/FLOPS": 244463741484167.38, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047850869596004486, "optim/lr": 3.0470663561661395e-06, "optim/total_tokens": 1997679886336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2627735137939453, "created_at": "2025-06-03T10:32:50.720102+00:00"} {"global_step": 238143, "acc_step": 0, "speed/wps": 5514.746559983178, "speed/FLOPS": 243723570919520.06, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04703868553042412, "optim/lr": 3.0435191310718146e-06, "optim/total_tokens": 1997688274944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2707715034484863, "created_at": "2025-06-03T10:32:53.699309+00:00"} {"global_step": 238144, "acc_step": 0, "speed/wps": 5512.137751414571, "speed/FLOPS": 243608274933880.38, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.71 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.71, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04722907394170761, "optim/lr": 3.039971905977268e-06, "optim/total_tokens": 1997696663552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2607474327087402, "created_at": "2025-06-03T10:32:56.679754+00:00"} {"global_step": 238145, "acc_step": 0, "speed/wps": 5523.511139184075, "speed/FLOPS": 244110920459016.6, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04814084619283676, "optim/lr": 3.036424680882721e-06, "optim/total_tokens": 1997705052160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.266296148300171, "created_at": "2025-06-03T10:32:59.652964+00:00"} {"global_step": 238146, "acc_step": 0, "speed/wps": 5512.025962519502, "speed/FLOPS": 243603334436905.78, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04786122590303421, "optim/lr": 3.0328774557881746e-06, "optim/total_tokens": 1997713440768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2545781135559082, "created_at": "2025-06-03T10:33:02.633392+00:00"} {"global_step": 238147, "acc_step": 0, "speed/wps": 5521.739860931013, "speed/FLOPS": 244032639026455.25, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046967554837465286, "optim/lr": 3.0293302306938497e-06, "optim/total_tokens": 1997721829376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2649797201156616, "created_at": "2025-06-03T10:33:05.607503+00:00"} {"global_step": 238148, "acc_step": 0, "speed/wps": 5529.494423381073, "speed/FLOPS": 244375350995299.16, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04652503505349159, "optim/lr": 3.025783005599303e-06, "optim/total_tokens": 1997730217984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2563624382019043, "created_at": "2025-06-03T10:33:08.578475+00:00"} {"global_step": 238149, "acc_step": 0, "speed/wps": 5515.451341129002, "speed/FLOPS": 243754718638768.56, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04785134643316269, "optim/lr": 3.022235780504756e-06, "optim/total_tokens": 1997738606592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2593059539794922, "created_at": "2025-06-03T10:33:11.557200+00:00"} {"global_step": 238150, "acc_step": 0, "speed/wps": 5531.913681250956, "speed/FLOPS": 244482269810263.66, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.049838196486234665, "optim/lr": 3.0186885554102097e-06, "optim/total_tokens": 1997746995200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 417, "loss/out": 1.2419167757034302, "created_at": "2025-06-03T10:33:14.523709+00:00"} {"global_step": 238151, "acc_step": 0, "speed/wps": 5517.199877768627, "speed/FLOPS": 243831995008418.12, "speed/curr_iter_time": 2.9675, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9675, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04764433205127716, "optim/lr": 3.0151413303158848e-06, "optim/total_tokens": 1997755383808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2433058023452759, "created_at": "2025-06-03T10:33:17.502613+00:00"} {"global_step": 238152, "acc_step": 0, "speed/wps": 5528.305142063098, "speed/FLOPS": 244322790848338.28, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04638335481286049, "optim/lr": 3.011594105221338e-06, "optim/total_tokens": 1997763772416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.255041241645813, "created_at": "2025-06-03T10:33:20.471586+00:00"} {"global_step": 238153, "acc_step": 0, "speed/wps": 5527.709458953195, "speed/FLOPS": 244296464703863.12, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04858814552426338, "optim/lr": 3.008046880126791e-06, "optim/total_tokens": 1997772161024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.254717469215393, "created_at": "2025-06-03T10:33:23.439937+00:00"} {"global_step": 238154, "acc_step": 0, "speed/wps": 5518.964098669522, "speed/FLOPS": 243909964542136.56, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046733081340789795, "optim/lr": 3.0044996550324667e-06, "optim/total_tokens": 1997780549632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2594056129455566, "created_at": "2025-06-03T10:33:26.412789+00:00"} {"global_step": 238155, "acc_step": 0, "speed/wps": 5524.682759716935, "speed/FLOPS": 244162700089671.5, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.7 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.7, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04813048616051674, "optim/lr": 3.00095242993792e-06, "optim/total_tokens": 1997788938240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2679332494735718, "created_at": "2025-06-03T10:33:29.385524+00:00"} {"global_step": 238156, "acc_step": 0, "speed/wps": 5531.768610742682, "speed/FLOPS": 244475858436336.12, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04783358797430992, "optim/lr": 2.997405204843373e-06, "optim/total_tokens": 1997797326848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2688175439834595, "created_at": "2025-06-03T10:33:32.354592+00:00"} {"global_step": 238157, "acc_step": 0, "speed/wps": 5523.084624820723, "speed/FLOPS": 244092070707254.84, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047757141292095184, "optim/lr": 2.9938579797488262e-06, "optim/total_tokens": 1997805715456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2748862504959106, "created_at": "2025-06-03T10:33:35.325477+00:00"} {"global_step": 238158, "acc_step": 0, "speed/wps": 5530.8643624037095, "speed/FLOPS": 244435895288116.12, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 195.83, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047858960926532745, "optim/lr": 2.9903107546545018e-06, "optim/total_tokens": 1997814104064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.249651312828064, "created_at": "2025-06-03T10:33:38.292532+00:00"} {"global_step": 238159, "acc_step": 0, "speed/wps": 5528.158017203777, "speed/FLOPS": 244316288682609.56, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048272330313920975, "optim/lr": 2.986763529559955e-06, "optim/total_tokens": 1997822492672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2684396505355835, "created_at": "2025-06-03T10:33:41.260851+00:00"} {"global_step": 238160, "acc_step": 0, "speed/wps": 5535.58236900897, "speed/FLOPS": 244644407031121.66, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04966888204216957, "optim/lr": 2.983216304465408e-06, "optim/total_tokens": 1997830881280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2689036130905151, "created_at": "2025-06-03T10:33:44.228160+00:00"} {"global_step": 238161, "acc_step": 0, "speed/wps": 5525.51225751029, "speed/FLOPS": 244199359646383.2, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048338960856199265, "optim/lr": 2.9796690793708613e-06, "optim/total_tokens": 1997839269888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2641361951828003, "created_at": "2025-06-03T10:33:47.201768+00:00"} {"global_step": 238162, "acc_step": 0, "speed/wps": 5527.844927436355, "speed/FLOPS": 244302451717428.22, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0480915866792202, "optim/lr": 2.976121854276537e-06, "optim/total_tokens": 1997847658496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2463316917419434, "created_at": "2025-06-03T10:33:50.173833+00:00"} {"global_step": 238163, "acc_step": 0, "speed/wps": 5522.749101385812, "speed/FLOPS": 244077242288796.4, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046567853540182114, "optim/lr": 2.97257462918199e-06, "optim/total_tokens": 1997856047104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.25627601146698, "created_at": "2025-06-03T10:33:53.145001+00:00"} {"global_step": 238164, "acc_step": 0, "speed/wps": 5508.052387534778, "speed/FLOPS": 243427722761181.47, "speed/curr_iter_time": 2.9735, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9735, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046575818210840225, "optim/lr": 2.969027404087443e-06, "optim/total_tokens": 1997864435712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2575962543487549, "created_at": "2025-06-03T10:33:56.127487+00:00"} {"global_step": 238165, "acc_step": 0, "speed/wps": 5514.408252087446, "speed/FLOPS": 243708619442145.5, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04647652059793472, "optim/lr": 2.9654801789928964e-06, "optim/total_tokens": 1997872824320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2757313251495361, "created_at": "2025-06-03T10:33:59.106713+00:00"} {"global_step": 238166, "acc_step": 0, "speed/wps": 5527.912462023293, "speed/FLOPS": 244305436400497.53, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0465388298034668, "optim/lr": 2.961932953898572e-06, "optim/total_tokens": 1997881212928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2564648389816284, "created_at": "2025-06-03T10:34:02.075948+00:00"} {"global_step": 238167, "acc_step": 0, "speed/wps": 5526.735520500397, "speed/FLOPS": 244253421609318.34, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047719720751047134, "optim/lr": 2.958385728804025e-06, "optim/total_tokens": 1997889601536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2544448375701904, "created_at": "2025-06-03T10:34:05.046577+00:00"} {"global_step": 238168, "acc_step": 0, "speed/wps": 5526.475526991668, "speed/FLOPS": 244241931226999.94, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04683474078774452, "optim/lr": 2.9548385037094783e-06, "optim/total_tokens": 1997897990144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2525559663772583, "created_at": "2025-06-03T10:34:08.015500+00:00"} {"global_step": 238169, "acc_step": 0, "speed/wps": 5515.213457434983, "speed/FLOPS": 243744205397092.06, "speed/curr_iter_time": 2.9697, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9697, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.69 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.69, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047064408659935, "optim/lr": 2.9512912786149315e-06, "optim/total_tokens": 1997906378752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2594425678253174, "created_at": "2025-06-03T10:34:10.996405+00:00"} {"global_step": 238170, "acc_step": 0, "speed/wps": 5527.20810837693, "speed/FLOPS": 244274307574537.06, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04762569069862366, "optim/lr": 2.947744053520607e-06, "optim/total_tokens": 1997914767360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2716503143310547, "created_at": "2025-06-03T10:34:13.965048+00:00"} {"global_step": 238171, "acc_step": 0, "speed/wps": 5529.248644759761, "speed/FLOPS": 244364488838246.2, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046650249511003494, "optim/lr": 2.94419682842606e-06, "optim/total_tokens": 1997923155968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.265106439590454, "created_at": "2025-06-03T10:34:16.935944+00:00"} {"global_step": 238172, "acc_step": 0, "speed/wps": 5523.918766026822, "speed/FLOPS": 244128935479042.7, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04619058966636658, "optim/lr": 2.9406496033315133e-06, "optim/total_tokens": 1997931544576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2523956298828125, "created_at": "2025-06-03T10:34:19.909711+00:00"} {"global_step": 238173, "acc_step": 0, "speed/wps": 5514.438653285563, "speed/FLOPS": 243709963019494.84, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.050105366855859756, "optim/lr": 2.9371023782369665e-06, "optim/total_tokens": 1997939933184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.262259602546692, "created_at": "2025-06-03T10:34:22.885150+00:00"} {"global_step": 238174, "acc_step": 0, "speed/wps": 5529.74985153614, "speed/FLOPS": 244386639612353.3, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047815144062042236, "optim/lr": 2.933555153142642e-06, "optim/total_tokens": 1997948321792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2642418146133423, "created_at": "2025-06-03T10:34:25.852300+00:00"} {"global_step": 238175, "acc_step": 0, "speed/wps": 5529.487619099588, "speed/FLOPS": 244375050280885.0, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046847160905599594, "optim/lr": 2.9300079280480952e-06, "optim/total_tokens": 1997956710400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2503236532211304, "created_at": "2025-06-03T10:34:28.820262+00:00"} {"global_step": 238176, "acc_step": 0, "speed/wps": 5534.447434867657, "speed/FLOPS": 244594248751195.16, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 195.79, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046975597739219666, "optim/lr": 2.9264607029535484e-06, "optim/total_tokens": 1997965099008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.260435700416565, "created_at": "2025-06-03T10:34:31.786698+00:00"} {"global_step": 238177, "acc_step": 0, "speed/wps": 5523.444390169367, "speed/FLOPS": 244107970494218.94, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04701629653573036, "optim/lr": 2.9229134778590016e-06, "optim/total_tokens": 1997973487616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.277158260345459, "created_at": "2025-06-03T10:34:34.757234+00:00"} {"global_step": 238178, "acc_step": 0, "speed/wps": 5525.061924332994, "speed/FLOPS": 244179457224960.84, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04841132462024689, "optim/lr": 2.919366252764677e-06, "optim/total_tokens": 1997981876224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2611758708953857, "created_at": "2025-06-03T10:34:37.731260+00:00"} {"global_step": 238179, "acc_step": 0, "speed/wps": 5532.145896005233, "speed/FLOPS": 244492532513819.84, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04688204452395439, "optim/lr": 2.9158190276701303e-06, "optim/total_tokens": 1997990264832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2519640922546387, "created_at": "2025-06-03T10:34:40.697380+00:00"} {"global_step": 238180, "acc_step": 0, "speed/wps": 5545.428781194297, "speed/FLOPS": 245079568051206.8, "speed/curr_iter_time": 2.9536, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9536, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 195.41, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0465899221599102, "optim/lr": 2.9122718025755835e-06, "optim/total_tokens": 1997998653440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2645817995071411, "created_at": "2025-06-03T10:34:43.659546+00:00"} {"global_step": 238181, "acc_step": 0, "speed/wps": 5522.419912832242, "speed/FLOPS": 244062693839668.38, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047348249703645706, "optim/lr": 2.9087245774812586e-06, "optim/total_tokens": 1998007042048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2766947746276855, "created_at": "2025-06-03T10:34:46.634018+00:00"} {"global_step": 238182, "acc_step": 0, "speed/wps": 5501.06154321533, "speed/FLOPS": 243118763224646.84, "speed/curr_iter_time": 2.9758, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9758, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 196.88, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04748259484767914, "optim/lr": 2.9051773523867118e-06, "optim/total_tokens": 1998015430656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2453701496124268, "created_at": "2025-06-03T10:34:49.619452+00:00"} {"global_step": 238183, "acc_step": 0, "speed/wps": 5538.703470736161, "speed/FLOPS": 244782343752216.66, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048360224813222885, "optim/lr": 2.9016301272921654e-06, "optim/total_tokens": 1998023819264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2701447010040283, "created_at": "2025-06-03T10:34:52.586009+00:00"} {"global_step": 238184, "acc_step": 0, "speed/wps": 5523.7412450380925, "speed/FLOPS": 244121089959975.66, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04604267701506615, "optim/lr": 2.8980829021976186e-06, "optim/total_tokens": 1998032207872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2721275091171265, "created_at": "2025-06-03T10:34:55.561492+00:00"} {"global_step": 238185, "acc_step": 0, "speed/wps": 5523.168617391928, "speed/FLOPS": 244095782748989.16, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04675175994634628, "optim/lr": 2.8945356771032937e-06, "optim/total_tokens": 1998040596480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2599421739578247, "created_at": "2025-06-03T10:34:58.537684+00:00"} {"global_step": 238186, "acc_step": 0, "speed/wps": 5525.4120787370575, "speed/FLOPS": 244194932257367.75, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04608255252242088, "optim/lr": 2.890988452008747e-06, "optim/total_tokens": 1998048985088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2682344913482666, "created_at": "2025-06-03T10:35:01.510164+00:00"} {"global_step": 238187, "acc_step": 0, "speed/wps": 5528.842587563196, "speed/FLOPS": 244346543188547.12, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048470109701156616, "optim/lr": 2.8874412269142005e-06, "optim/total_tokens": 1998057373696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2644699811935425, "created_at": "2025-06-03T10:35:04.478512+00:00"} {"global_step": 238188, "acc_step": 0, "speed/wps": 5518.748718918985, "speed/FLOPS": 243900445859576.3, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04660097137093544, "optim/lr": 2.8838940018196536e-06, "optim/total_tokens": 1998065762304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2638609409332275, "created_at": "2025-06-03T10:35:07.454554+00:00"} {"global_step": 238189, "acc_step": 0, "speed/wps": 5523.323299434353, "speed/FLOPS": 244102618903529.9, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046793606132268906, "optim/lr": 2.8803467767253288e-06, "optim/total_tokens": 1998074150912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2668489217758179, "created_at": "2025-06-03T10:35:10.428655+00:00"} {"global_step": 238190, "acc_step": 0, "speed/wps": 5536.895811970055, "speed/FLOPS": 244702454487191.1, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 195.72, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04721961170434952, "optim/lr": 2.876799551630782e-06, "optim/total_tokens": 1998082539520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.2556074857711792, "created_at": "2025-06-03T10:35:13.393936+00:00"} {"global_step": 238191, "acc_step": 0, "speed/wps": 5532.834365641592, "speed/FLOPS": 244522959347839.88, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.67 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.67, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04703047499060631, "optim/lr": 2.8732523265362355e-06, "optim/total_tokens": 1998090928128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.246801733970642, "created_at": "2025-06-03T10:35:16.359600+00:00"} {"global_step": 238192, "acc_step": 0, "speed/wps": 5403.974262787739, "speed/FLOPS": 238828002367497.03, "speed/curr_iter_time": 3.0294, "speed/data_load_time": 0.0007, "speed/curr_step_time": 3.0294, "speed/est_time_elapsed": "8.35 days", "speed/est_time_remaining": "0.68 hours", "speed/est_time_elapsed_hrs": 200.44, "speed/est_time_elapsed_days": 8.35, "speed/est_time_remaining_hrs": 0.68, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04729423299431801, "optim/lr": 2.8697051014416887e-06, "optim/total_tokens": 1998099316736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 356, "loss/out": 1.2541420459747314, "created_at": "2025-06-03T10:35:19.396594+00:00"} {"global_step": 238193, "acc_step": 0, "speed/wps": 5519.861032158084, "speed/FLOPS": 243949604411409.2, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0012, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.056921813637018204, "optim/lr": 2.866157876347364e-06, "optim/total_tokens": 1998107705344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2349677085876465, "created_at": "2025-06-03T10:35:22.371329+00:00"} {"global_step": 238194, "acc_step": 0, "speed/wps": 5527.227278853056, "speed/FLOPS": 244275154811458.47, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0009, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05416053906083107, "optim/lr": 2.862610651252817e-06, "optim/total_tokens": 1998116093952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.249058485031128, "created_at": "2025-06-03T10:35:25.340298+00:00"} {"global_step": 238195, "acc_step": 0, "speed/wps": 5519.411274161397, "speed/FLOPS": 243929727410025.75, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04944804310798645, "optim/lr": 2.8590634261582706e-06, "optim/total_tokens": 1998124482560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.270379662513733, "created_at": "2025-06-03T10:35:28.315706+00:00"} {"global_step": 238196, "acc_step": 0, "speed/wps": 5511.643968774619, "speed/FLOPS": 243586452268603.16, "speed/curr_iter_time": 2.9714, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9714, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 196.6, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048372745513916016, "optim/lr": 2.855516201063724e-06, "optim/total_tokens": 1998132871168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2451930046081543, "created_at": "2025-06-03T10:35:31.296629+00:00"} {"global_step": 238197, "acc_step": 0, "speed/wps": 5511.084381205466, "speed/FLOPS": 243561721362275.44, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.050485216081142426, "optim/lr": 2.851968975969399e-06, "optim/total_tokens": 1998141259776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2471882104873657, "created_at": "2025-06-03T10:35:34.278109+00:00"} {"global_step": 238198, "acc_step": 0, "speed/wps": 5530.580715246334, "speed/FLOPS": 244423359535597.88, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 195.94, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05489050969481468, "optim/lr": 2.848421750874852e-06, "optim/total_tokens": 1998149648384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2548637390136719, "created_at": "2025-06-03T10:35:37.248681+00:00"} {"global_step": 238199, "acc_step": 0, "speed/wps": 5529.964287787203, "speed/FLOPS": 244396116597066.03, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05229952186346054, "optim/lr": 2.8448745257803053e-06, "optim/total_tokens": 1998158036992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.266654372215271, "created_at": "2025-06-03T10:35:40.215733+00:00"} {"global_step": 238200, "acc_step": 0, "speed/wps": 5539.043806225563, "speed/FLOPS": 244797384838853.28, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.050959739834070206, "optim/lr": 2.841327300685759e-06, "optim/total_tokens": 1998166425600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2509241104125977, "created_at": "2025-06-03T10:35:43.177623+00:00"} {"global_step": 238201, "acc_step": 0, "speed/wps": 5539.018852123803, "speed/FLOPS": 244796281995282.2, "speed/curr_iter_time": 2.9569, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9569, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 195.65, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05089949816465378, "optim/lr": 2.837780075591434e-06, "optim/total_tokens": 1998174814208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2458841800689697, "created_at": "2025-06-03T10:35:46.139764+00:00"} {"global_step": 238202, "acc_step": 0, "speed/wps": 5527.874940240373, "speed/FLOPS": 244303778129746.34, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.050142399966716766, "optim/lr": 2.834232850496887e-06, "optim/total_tokens": 1998183202816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2562055587768555, "created_at": "2025-06-03T10:35:49.112249+00:00"} {"global_step": 238203, "acc_step": 0, "speed/wps": 5516.958263575432, "speed/FLOPS": 243821316897772.5, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048913903534412384, "optim/lr": 2.8306856254023403e-06, "optim/total_tokens": 1998191591424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2641563415527344, "created_at": "2025-06-03T10:35:52.092542+00:00"} {"global_step": 238204, "acc_step": 0, "speed/wps": 5521.08307011255, "speed/FLOPS": 244003612234039.3, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.66 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.66, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.050042275339365005, "optim/lr": 2.827138400307794e-06, "optim/total_tokens": 1998199980032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2521811723709106, "created_at": "2025-06-03T10:35:55.064967+00:00"} {"global_step": 238205, "acc_step": 0, "speed/wps": 5523.400450994284, "speed/FLOPS": 244106028607581.38, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04866807535290718, "optim/lr": 2.823591175213469e-06, "optim/total_tokens": 1998208368640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2451179027557373, "created_at": "2025-06-03T10:35:58.036684+00:00"} {"global_step": 238206, "acc_step": 0, "speed/wps": 5524.533221794338, "speed/FLOPS": 244156091278897.2, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047781143337488174, "optim/lr": 2.8200439501189222e-06, "optim/total_tokens": 1998216757248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2425565719604492, "created_at": "2025-06-03T10:36:01.009015+00:00"} {"global_step": 238207, "acc_step": 0, "speed/wps": 5513.3690953500145, "speed/FLOPS": 243662694033237.38, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047214869409799576, "optim/lr": 2.8164967250243754e-06, "optim/total_tokens": 1998225145856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2357289791107178, "created_at": "2025-06-03T10:36:03.987247+00:00"} {"global_step": 238208, "acc_step": 0, "speed/wps": 5528.829350159248, "speed/FLOPS": 244345958163047.8, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04789891466498375, "optim/lr": 2.812949499930051e-06, "optim/total_tokens": 1998233534464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2417569160461426, "created_at": "2025-06-03T10:36:06.954680+00:00"} {"global_step": 238209, "acc_step": 0, "speed/wps": 5542.501291564196, "speed/FLOPS": 244950187993806.66, "speed/curr_iter_time": 2.9542, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9542, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 195.48, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04882184788584709, "optim/lr": 2.809402274835504e-06, "optim/total_tokens": 1998241923072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2459696531295776, "created_at": "2025-06-03T10:36:09.918421+00:00"} {"global_step": 238210, "acc_step": 0, "speed/wps": 5515.630516802409, "speed/FLOPS": 243762637286428.94, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.050295960158109665, "optim/lr": 2.8058550497409573e-06, "optim/total_tokens": 1998250311680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.245351791381836, "created_at": "2025-06-03T10:36:12.897362+00:00"} {"global_step": 238211, "acc_step": 0, "speed/wps": 5514.247157821742, "speed/FLOPS": 243701499900156.6, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.049263276159763336, "optim/lr": 2.8023078246464105e-06, "optim/total_tokens": 1998258700288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2545610666275024, "created_at": "2025-06-03T10:36:15.878012+00:00"} {"global_step": 238212, "acc_step": 0, "speed/wps": 5521.529854271778, "speed/FLOPS": 244023357807028.6, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04861859604716301, "optim/lr": 2.798760599552086e-06, "optim/total_tokens": 1998267088896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.253967523574829, "created_at": "2025-06-03T10:36:18.850206+00:00"} {"global_step": 238213, "acc_step": 0, "speed/wps": 5522.224885911013, "speed/FLOPS": 244054074647988.34, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04905732348561287, "optim/lr": 2.795213374457539e-06, "optim/total_tokens": 1998275477504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2495006322860718, "created_at": "2025-06-03T10:36:21.824489+00:00"} {"global_step": 238214, "acc_step": 0, "speed/wps": 5523.953062110413, "speed/FLOPS": 244130451190394.16, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0474364347755909, "optim/lr": 2.7916661493629924e-06, "optim/total_tokens": 1998283866112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.246626853942871, "created_at": "2025-06-03T10:36:24.795427+00:00"} {"global_step": 238215, "acc_step": 0, "speed/wps": 5532.714662472831, "speed/FLOPS": 244517669080477.0, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.65 hours", "speed/est_time_elapsed_hrs": 195.81, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.65, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04823683574795723, "optim/lr": 2.7881189242684456e-06, "optim/total_tokens": 1998292254720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2568738460540771, "created_at": "2025-06-03T10:36:27.761984+00:00"} {"global_step": 238216, "acc_step": 0, "speed/wps": 5539.745957364292, "speed/FLOPS": 244828416325249.78, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04896065220236778, "optim/lr": 2.784571699174121e-06, "optim/total_tokens": 1998300643328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2602256536483765, "created_at": "2025-06-03T10:36:30.723753+00:00"} {"global_step": 238217, "acc_step": 0, "speed/wps": 5530.093589944161, "speed/FLOPS": 244401831090575.16, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047374628484249115, "optim/lr": 2.7810244740795743e-06, "optim/total_tokens": 1998309031936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.250357747077942, "created_at": "2025-06-03T10:36:33.691868+00:00"} {"global_step": 238218, "acc_step": 0, "speed/wps": 5526.180342797996, "speed/FLOPS": 244228885596529.28, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04963847994804382, "optim/lr": 2.7774772489850275e-06, "optim/total_tokens": 1998317420544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2455230951309204, "created_at": "2025-06-03T10:36:36.661624+00:00"} {"global_step": 238219, "acc_step": 0, "speed/wps": 5530.167733354323, "speed/FLOPS": 244405107849803.94, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047970280051231384, "optim/lr": 2.7739300238904806e-06, "optim/total_tokens": 1998325809152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2665718793869019, "created_at": "2025-06-03T10:36:39.629243+00:00"} {"global_step": 238220, "acc_step": 0, "speed/wps": 5531.576423334167, "speed/FLOPS": 244467364736584.1, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0483119823038578, "optim/lr": 2.770382798796156e-06, "optim/total_tokens": 1998334197760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2507598400115967, "created_at": "2025-06-03T10:36:42.598754+00:00"} {"global_step": 238221, "acc_step": 0, "speed/wps": 5522.890899021249, "speed/FLOPS": 244083509018496.66, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04966640844941139, "optim/lr": 2.7668355737016094e-06, "optim/total_tokens": 1998342586368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.251208782196045, "created_at": "2025-06-03T10:36:45.575663+00:00"} {"global_step": 238222, "acc_step": 0, "speed/wps": 5522.716888176494, "speed/FLOPS": 244075818629826.7, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048145998269319534, "optim/lr": 2.7632883486070625e-06, "optim/total_tokens": 1998350974976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.247889757156372, "created_at": "2025-06-03T10:36:48.547394+00:00"} {"global_step": 238223, "acc_step": 0, "speed/wps": 5523.9394088436275, "speed/FLOPS": 244129847785886.0, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0473465770483017, "optim/lr": 2.7597411235125157e-06, "optim/total_tokens": 1998359363584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.236936330795288, "created_at": "2025-06-03T10:36:51.518265+00:00"} {"global_step": 238224, "acc_step": 0, "speed/wps": 5531.306741912571, "speed/FLOPS": 244455446198104.2, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046888671815395355, "optim/lr": 2.7561938984181912e-06, "optim/total_tokens": 1998367752192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.252217173576355, "created_at": "2025-06-03T10:36:54.484721+00:00"} {"global_step": 238225, "acc_step": 0, "speed/wps": 5540.216306853048, "speed/FLOPS": 244849203365185.88, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 195.63, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0474201962351799, "optim/lr": 2.7526466733236444e-06, "optim/total_tokens": 1998376140800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2584820985794067, "created_at": "2025-06-03T10:36:57.446403+00:00"} {"global_step": 238226, "acc_step": 0, "speed/wps": 5533.090445298443, "speed/FLOPS": 244534276757938.2, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04813708737492561, "optim/lr": 2.7490994482290976e-06, "optim/total_tokens": 1998384529408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2409555912017822, "created_at": "2025-06-03T10:37:00.416864+00:00"} {"global_step": 238227, "acc_step": 0, "speed/wps": 5523.091329254842, "speed/FLOPS": 244092367008926.53, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047502551227808, "optim/lr": 2.745552223134551e-06, "optim/total_tokens": 1998392918016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2416969537734985, "created_at": "2025-06-03T10:37:03.390751+00:00"} {"global_step": 238228, "acc_step": 0, "speed/wps": 5538.8611682758865, "speed/FLOPS": 244789313176303.38, "speed/curr_iter_time": 2.957, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.957, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 195.68, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047460030764341354, "optim/lr": 2.7420049980402263e-06, "optim/total_tokens": 1998401306624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2593464851379395, "created_at": "2025-06-03T10:37:06.354591+00:00"} {"global_step": 238229, "acc_step": 0, "speed/wps": 5515.164734837222, "speed/FLOPS": 243742052107655.88, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.64 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.64, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048354003578424454, "optim/lr": 2.7384577729456795e-06, "optim/total_tokens": 1998409695232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.245389461517334, "created_at": "2025-06-03T10:37:09.332095+00:00"} {"global_step": 238230, "acc_step": 0, "speed/wps": 5518.153651097323, "speed/FLOPS": 243874146907692.06, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04743088781833649, "optim/lr": 2.7349105478511327e-06, "optim/total_tokens": 1998418083840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.269116997718811, "created_at": "2025-06-03T10:37:12.305916+00:00"} {"global_step": 238231, "acc_step": 0, "speed/wps": 5515.571251277264, "speed/FLOPS": 243760018053566.0, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048378318548202515, "optim/lr": 2.731363322756586e-06, "optim/total_tokens": 1998426472448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2682300806045532, "created_at": "2025-06-03T10:37:15.286741+00:00"} {"global_step": 238232, "acc_step": 0, "speed/wps": 5506.894193009141, "speed/FLOPS": 243376536491325.3, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047729093581438065, "optim/lr": 2.7278160976622614e-06, "optim/total_tokens": 1998434861056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2615103721618652, "created_at": "2025-06-03T10:37:18.266899+00:00"} {"global_step": 238233, "acc_step": 0, "speed/wps": 5534.072467842117, "speed/FLOPS": 244577677127921.5, "speed/curr_iter_time": 2.9596, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9596, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.048628177493810654, "optim/lr": 2.7242688725677146e-06, "optim/total_tokens": 1998443249664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.237539529800415, "created_at": "2025-06-03T10:37:21.231520+00:00"} {"global_step": 238234, "acc_step": 0, "speed/wps": 5525.530420906979, "speed/FLOPS": 244200162375548.16, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047934722155332565, "optim/lr": 2.7207216474731678e-06, "optim/total_tokens": 1998451638272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2607296705245972, "created_at": "2025-06-03T10:37:24.205525+00:00"} {"global_step": 238235, "acc_step": 0, "speed/wps": 5511.406545044546, "speed/FLOPS": 243575959354978.75, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.049394622445106506, "optim/lr": 2.717174422378843e-06, "optim/total_tokens": 1998460026880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2627941370010376, "created_at": "2025-06-03T10:37:27.183310+00:00"} {"global_step": 238236, "acc_step": 0, "speed/wps": 5532.654061371671, "speed/FLOPS": 244514990821990.25, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.0467931292951107, "optim/lr": 2.7136271972842965e-06, "optim/total_tokens": 1998468415488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.259089469909668, "created_at": "2025-06-03T10:37:30.149521+00:00"} {"global_step": 238237, "acc_step": 0, "speed/wps": 5533.041206204682, "speed/FLOPS": 244532100642022.47, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04811916500329971, "optim/lr": 2.7100799721897497e-06, "optim/total_tokens": 1998476804096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2451823949813843, "created_at": "2025-06-03T10:37:33.116373+00:00"} {"global_step": 238238, "acc_step": 0, "speed/wps": 5526.825129606351, "speed/FLOPS": 244257381873140.53, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047292813658714294, "optim/lr": 2.706532747095203e-06, "optim/total_tokens": 1998485192704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2412512302398682, "created_at": "2025-06-03T10:37:36.086753+00:00"} {"global_step": 238239, "acc_step": 0, "speed/wps": 5525.965608866356, "speed/FLOPS": 244219395455858.72, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.05051714554429054, "optim/lr": 2.702985522000878e-06, "optim/total_tokens": 1998493581312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2488198280334473, "created_at": "2025-06-03T10:37:39.060176+00:00"} {"global_step": 238240, "acc_step": 0, "speed/wps": 5528.3094213660315, "speed/FLOPS": 244322979971624.47, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04690677672624588, "optim/lr": 2.6994382969063316e-06, "optim/total_tokens": 1998501969920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.259506344795227, "created_at": "2025-06-03T10:37:42.029710+00:00"} {"global_step": 238241, "acc_step": 0, "speed/wps": 5514.265666380687, "speed/FLOPS": 243702317883726.6, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.63 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.63, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04715752974152565, "optim/lr": 2.6958910718117847e-06, "optim/total_tokens": 1998510358528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2624989748001099, "created_at": "2025-06-03T10:37:45.008520+00:00"} {"global_step": 238242, "acc_step": 0, "speed/wps": 5531.262018433243, "speed/FLOPS": 244453469649233.4, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04792935028672218, "optim/lr": 2.692343846717238e-06, "optim/total_tokens": 1998518747136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2408720254898071, "created_at": "2025-06-03T10:37:47.979501+00:00"} {"global_step": 238243, "acc_step": 0, "speed/wps": 5532.566252769812, "speed/FLOPS": 244511110131233.28, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047426674515008926, "optim/lr": 2.688796621622913e-06, "optim/total_tokens": 1998527135744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2575289011001587, "created_at": "2025-06-03T10:37:50.949857+00:00"} {"global_step": 238244, "acc_step": 0, "speed/wps": 5506.171556610795, "speed/FLOPS": 243344599661306.8, "speed/curr_iter_time": 2.9746, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9746, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.86, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04790313169360161, "optim/lr": 2.6852493965283666e-06, "optim/total_tokens": 1998535524352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2652177810668945, "created_at": "2025-06-03T10:37:53.930624+00:00"} {"global_step": 238245, "acc_step": 0, "speed/wps": 5526.618530420798, "speed/FLOPS": 244248251246609.6, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04763542860746384, "optim/lr": 2.68170217143382e-06, "optim/total_tokens": 1998543912960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2523061037063599, "created_at": "2025-06-03T10:37:56.903642+00:00"} {"global_step": 238246, "acc_step": 0, "speed/wps": 5523.866453514023, "speed/FLOPS": 244126623533736.72, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04787592962384224, "optim/lr": 2.678154946339273e-06, "optim/total_tokens": 1998552301568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.276247262954712, "created_at": "2025-06-03T10:37:59.874074+00:00"} {"global_step": 238247, "acc_step": 0, "speed/wps": 5520.738863063634, "speed/FLOPS": 243988400044288.62, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.34, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04760412871837616, "optim/lr": 2.674607721244948e-06, "optim/total_tokens": 1998560690176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2514604330062866, "created_at": "2025-06-03T10:38:02.849358+00:00"} {"global_step": 238248, "acc_step": 0, "speed/wps": 5516.475291977953, "speed/FLOPS": 243799972025236.66, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04737231880426407, "optim/lr": 2.6710604961504013e-06, "optim/total_tokens": 1998569078784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2485857009887695, "created_at": "2025-06-03T10:38:05.825084+00:00"} {"global_step": 238249, "acc_step": 0, "speed/wps": 5514.63661044199, "speed/FLOPS": 243718711712572.34, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04787518084049225, "optim/lr": 2.667513271055855e-06, "optim/total_tokens": 1998577467392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2399567365646362, "created_at": "2025-06-03T10:38:08.800287+00:00"} {"global_step": 238250, "acc_step": 0, "speed/wps": 5526.706399913707, "speed/FLOPS": 244252134628439.34, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04797757416963577, "optim/lr": 2.663966045961308e-06, "optim/total_tokens": 1998585856000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2408761978149414, "created_at": "2025-06-03T10:38:11.771395+00:00"} {"global_step": 238251, "acc_step": 0, "speed/wps": 5533.436188654956, "speed/FLOPS": 244549556844621.12, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04837659373879433, "optim/lr": 2.660418820866983e-06, "optim/total_tokens": 1998594244608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2598845958709717, "created_at": "2025-06-03T10:38:14.738311+00:00"} {"global_step": 238252, "acc_step": 0, "speed/wps": 5523.085583710729, "speed/FLOPS": 244092113085285.1, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.62 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.62, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046674180775880814, "optim/lr": 2.6568715957724364e-06, "optim/total_tokens": 1998602633216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2445050477981567, "created_at": "2025-06-03T10:38:17.714038+00:00"} {"global_step": 238253, "acc_step": 0, "speed/wps": 5530.462062766993, "speed/FLOPS": 244418115703329.44, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04975396394729614, "optim/lr": 2.65332437067789e-06, "optim/total_tokens": 1998611021824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2464908361434937, "created_at": "2025-06-03T10:38:20.682462+00:00"} {"global_step": 238254, "acc_step": 0, "speed/wps": 5534.341336526098, "speed/FLOPS": 244589559747558.78, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04751984402537346, "optim/lr": 2.649777145583343e-06, "optim/total_tokens": 1998619410432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2512844800949097, "created_at": "2025-06-03T10:38:23.650534+00:00"} {"global_step": 238255, "acc_step": 0, "speed/wps": 5522.547933187394, "speed/FLOPS": 244068351684098.53, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04758881777524948, "optim/lr": 2.6462299204890182e-06, "optim/total_tokens": 1998627799040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2535382509231567, "created_at": "2025-06-03T10:38:26.621914+00:00"} {"global_step": 238256, "acc_step": 0, "speed/wps": 5519.416522865051, "speed/FLOPS": 243929959375861.97, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04711119458079338, "optim/lr": 2.6426826953944714e-06, "optim/total_tokens": 1998636187648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2491350173950195, "created_at": "2025-06-03T10:38:29.597241+00:00"} {"global_step": 238257, "acc_step": 0, "speed/wps": 5532.317589589925, "speed/FLOPS": 244500120491455.78, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04732520878314972, "optim/lr": 2.639135470299925e-06, "optim/total_tokens": 1998644576256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2573176622390747, "created_at": "2025-06-03T10:38:32.563148+00:00"} {"global_step": 238258, "acc_step": 0, "speed/wps": 5534.737205936833, "speed/FLOPS": 244607055149269.97, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04746312275528908, "optim/lr": 2.6355882452053782e-06, "optim/total_tokens": 1998652964864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2510793209075928, "created_at": "2025-06-03T10:38:35.527981+00:00"} {"global_step": 238259, "acc_step": 0, "speed/wps": 5528.729670499105, "speed/FLOPS": 244341552832276.25, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04696124419569969, "optim/lr": 2.6320410201110533e-06, "optim/total_tokens": 1998661353472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2551060914993286, "created_at": "2025-06-03T10:38:38.495442+00:00"} {"global_step": 238260, "acc_step": 0, "speed/wps": 5531.075730991891, "speed/FLOPS": 244445236697831.22, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04704342782497406, "optim/lr": 2.6284937950165065e-06, "optim/total_tokens": 1998669742080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2612855434417725, "created_at": "2025-06-03T10:38:41.461794+00:00"} {"global_step": 238261, "acc_step": 0, "speed/wps": 5527.714473339456, "speed/FLOPS": 244296686314069.9, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046888623386621475, "optim/lr": 2.62494656992196e-06, "optim/total_tokens": 1998678130688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2603211402893066, "created_at": "2025-06-03T10:38:44.430908+00:00"} {"global_step": 238262, "acc_step": 0, "speed/wps": 5534.380406473817, "speed/FLOPS": 244591286439269.88, "speed/curr_iter_time": 2.9592, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9592, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 195.85, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047426823526620865, "optim/lr": 2.6213993448276352e-06, "optim/total_tokens": 1998686519296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2464842796325684, "created_at": "2025-06-03T10:38:47.395894+00:00"} {"global_step": 238263, "acc_step": 0, "speed/wps": 5519.582202001832, "speed/FLOPS": 243937281545685.0, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.046853307634592056, "optim/lr": 2.6178521197330884e-06, "optim/total_tokens": 1998694907904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2457739114761353, "created_at": "2025-06-03T10:38:50.368692+00:00"} {"global_step": 238264, "acc_step": 0, "speed/wps": 5524.180235904628, "speed/FLOPS": 244140491109317.56, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047947872430086136, "optim/lr": 2.6143048946385416e-06, "optim/total_tokens": 1998703296512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2490589618682861, "created_at": "2025-06-03T10:38:53.339253+00:00"} {"global_step": 238265, "acc_step": 0, "speed/wps": 5522.137983086816, "speed/FLOPS": 244050233987967.8, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.61 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.61, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04782570153474808, "optim/lr": 2.6107576695439948e-06, "optim/total_tokens": 1998711685120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.249696969985962, "created_at": "2025-06-03T10:38:56.316037+00:00"} {"global_step": 238266, "acc_step": 0, "speed/wps": 5537.664407282272, "speed/FLOPS": 244736422465963.66, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04763961210846901, "optim/lr": 2.6072104444496703e-06, "optim/total_tokens": 1998720073728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2619380950927734, "created_at": "2025-06-03T10:38:59.279064+00:00"} {"global_step": 238267, "acc_step": 0, "speed/wps": 5531.933676307419, "speed/FLOPS": 244483153489415.34, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04754321649670601, "optim/lr": 2.6036632193551235e-06, "optim/total_tokens": 1998728462336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.264634609222412, "created_at": "2025-06-03T10:39:02.246352+00:00"} {"global_step": 238268, "acc_step": 0, "speed/wps": 5540.057959458305, "speed/FLOPS": 244842205220833.7, "speed/curr_iter_time": 2.9563, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9563, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04779820144176483, "optim/lr": 2.6001159942605767e-06, "optim/total_tokens": 1998736850944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2667429447174072, "created_at": "2025-06-03T10:39:05.208111+00:00"} {"global_step": 238269, "acc_step": 0, "speed/wps": 5528.011893780829, "speed/FLOPS": 244309830775242.75, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04705924168229103, "optim/lr": 2.59656876916603e-06, "optim/total_tokens": 1998745239552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.25672447681427, "created_at": "2025-06-03T10:39:08.180343+00:00"} {"global_step": 238270, "acc_step": 0, "speed/wps": 5526.623119629095, "speed/FLOPS": 244248454066126.6, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.04847458750009537, "optim/lr": 2.5930215440717054e-06, "optim/total_tokens": 1998753628160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2669789791107178, "created_at": "2025-06-03T10:39:11.152907+00:00"} {"global_step": 238271, "acc_step": 0, "speed/wps": 5524.69040752654, "speed/FLOPS": 244163038083711.0, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.03, "optim/grad_norm": 0.047238994389772415, "optim/lr": 2.5894743189771585e-06, "optim/total_tokens": 1998762016768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2611019611358643, "created_at": "2025-06-03T10:39:14.122749+00:00"} {"global_step": 238272, "acc_step": 0, "speed/wps": 5526.082387303335, "speed/FLOPS": 244224556465046.97, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04725264757871628, "optim/lr": 2.5859270938826117e-06, "optim/total_tokens": 1998770405376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2645272016525269, "created_at": "2025-06-03T10:39:17.095292+00:00"} {"global_step": 238273, "acc_step": 0, "speed/wps": 5525.163154571849, "speed/FLOPS": 244183931083374.94, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04709606245160103, "optim/lr": 2.582379868788065e-06, "optim/total_tokens": 1998778793984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2545989751815796, "created_at": "2025-06-03T10:39:20.064943+00:00"} {"global_step": 238274, "acc_step": 0, "speed/wps": 5515.783799793094, "speed/FLOPS": 243769411610043.72, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04841938242316246, "optim/lr": 2.5788326436937404e-06, "optim/total_tokens": 1998787182592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2619926929473877, "created_at": "2025-06-03T10:39:23.042521+00:00"} {"global_step": 238275, "acc_step": 0, "speed/wps": 5531.243296473632, "speed/FLOPS": 244452642234446.28, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047779954969882965, "optim/lr": 2.5752854185991936e-06, "optim/total_tokens": 1998795571200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.250693917274475, "created_at": "2025-06-03T10:39:26.009128+00:00"} {"global_step": 238276, "acc_step": 0, "speed/wps": 5534.962481739093, "speed/FLOPS": 244617011186663.78, "speed/curr_iter_time": 2.9579, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9579, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 195.78, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04728680104017258, "optim/lr": 2.571738193504647e-06, "optim/total_tokens": 1998803959808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2463115453720093, "created_at": "2025-06-03T10:39:28.974023+00:00"} {"global_step": 238277, "acc_step": 0, "speed/wps": 5527.25170786839, "speed/FLOPS": 244276234448897.2, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.6 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.6, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04920673742890358, "optim/lr": 2.5681909684101e-06, "optim/total_tokens": 1998812348416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.253280520439148, "created_at": "2025-06-03T10:39:31.948604+00:00"} {"global_step": 238278, "acc_step": 0, "speed/wps": 5536.608301352935, "speed/FLOPS": 244689747989527.16, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04879855364561081, "optim/lr": 2.5646437433157755e-06, "optim/total_tokens": 1998820737024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.266754150390625, "created_at": "2025-06-03T10:39:34.912302+00:00"} {"global_step": 238279, "acc_step": 0, "speed/wps": 5526.040076019732, "speed/FLOPS": 244222686522880.47, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04742227494716644, "optim/lr": 2.5610965182212287e-06, "optim/total_tokens": 1998829125632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.264658808708191, "created_at": "2025-06-03T10:39:37.886345+00:00"} {"global_step": 238280, "acc_step": 0, "speed/wps": 5521.889718239866, "speed/FLOPS": 244039261952467.28, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.050600193440914154, "optim/lr": 2.557549293126682e-06, "optim/total_tokens": 1998837514240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2468783855438232, "created_at": "2025-06-03T10:39:40.861758+00:00"} {"global_step": 238281, "acc_step": 0, "speed/wps": 5522.664831176267, "speed/FLOPS": 244073517976868.56, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048412516713142395, "optim/lr": 2.554002068032135e-06, "optim/total_tokens": 1998845902848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.246610403060913, "created_at": "2025-06-03T10:39:43.836129+00:00"} {"global_step": 238282, "acc_step": 0, "speed/wps": 5518.6940117541335, "speed/FLOPS": 243898028082906.53, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04675913602113724, "optim/lr": 2.5504548429378106e-06, "optim/total_tokens": 1998854291456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2488186359405518, "created_at": "2025-06-03T10:39:46.809135+00:00"} {"global_step": 238283, "acc_step": 0, "speed/wps": 5525.876396472566, "speed/FLOPS": 244215452724683.62, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0470944382250309, "optim/lr": 2.5469076178432638e-06, "optim/total_tokens": 1998862680064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2447205781936646, "created_at": "2025-06-03T10:39:49.780429+00:00"} {"global_step": 238284, "acc_step": 0, "speed/wps": 5543.794958856924, "speed/FLOPS": 245007361466555.72, "speed/curr_iter_time": 2.9544, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9544, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 195.55, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047975871711969376, "optim/lr": 2.543360392748717e-06, "optim/total_tokens": 1998871068672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.267915964126587, "created_at": "2025-06-03T10:39:52.740469+00:00"} {"global_step": 238285, "acc_step": 0, "speed/wps": 5523.635914486781, "speed/FLOPS": 244116434888738.3, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04730257764458656, "optim/lr": 2.53981316765417e-06, "optim/total_tokens": 1998879457280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.255223274230957, "created_at": "2025-06-03T10:39:55.714501+00:00"} {"global_step": 238286, "acc_step": 0, "speed/wps": 5531.998923698288, "speed/FLOPS": 244486037090125.34, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 195.88, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04780028387904167, "optim/lr": 2.5362659425598457e-06, "optim/total_tokens": 1998887845888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2642333507537842, "created_at": "2025-06-03T10:39:58.680877+00:00"} {"global_step": 238287, "acc_step": 0, "speed/wps": 5527.674425373254, "speed/FLOPS": 244294916398947.84, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04766537621617317, "optim/lr": 2.532718717465299e-06, "optim/total_tokens": 1998896234496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2532577514648438, "created_at": "2025-06-03T10:40:01.650651+00:00"} {"global_step": 238288, "acc_step": 0, "speed/wps": 5524.34681006315, "speed/FLOPS": 244147852834520.4, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04788690432906151, "optim/lr": 2.529171492370752e-06, "optim/total_tokens": 1998904623104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2516719102859497, "created_at": "2025-06-03T10:40:04.620798+00:00"} {"global_step": 238289, "acc_step": 0, "speed/wps": 5516.845250117216, "speed/FLOPS": 243816322281374.66, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04677284136414528, "optim/lr": 2.5256242672764276e-06, "optim/total_tokens": 1998913011712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2551547288894653, "created_at": "2025-06-03T10:40:07.599268+00:00"} {"global_step": 238290, "acc_step": 0, "speed/wps": 5512.021406588565, "speed/FLOPS": 243603133088077.72, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.59 hours", "speed/est_time_elapsed_hrs": 196.6, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.59, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04715007543563843, "optim/lr": 2.5220770421818807e-06, "optim/total_tokens": 1998921400320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2548972368240356, "created_at": "2025-06-03T10:40:10.578391+00:00"} {"global_step": 238291, "acc_step": 0, "speed/wps": 5522.368888545925, "speed/FLOPS": 244060438827379.16, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04650075361132622, "optim/lr": 2.518529817087334e-06, "optim/total_tokens": 1998929788928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2522883415222168, "created_at": "2025-06-03T10:40:13.553284+00:00"} {"global_step": 238292, "acc_step": 0, "speed/wps": 5514.669160335738, "speed/FLOPS": 243720150251270.5, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047586265951395035, "optim/lr": 2.514982591992787e-06, "optim/total_tokens": 1998938177536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2552576065063477, "created_at": "2025-06-03T10:40:16.533039+00:00"} {"global_step": 238293, "acc_step": 0, "speed/wps": 5538.0977159415115, "speed/FLOPS": 244755572490827.28, "speed/curr_iter_time": 2.9561, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9561, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 195.67, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047942377626895905, "optim/lr": 2.5114353668984622e-06, "optim/total_tokens": 1998946566144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2679425477981567, "created_at": "2025-06-03T10:40:19.496115+00:00"} {"global_step": 238294, "acc_step": 0, "speed/wps": 5534.529345333063, "speed/FLOPS": 244597868774510.38, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 195.89, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04781367629766464, "optim/lr": 2.507888141803916e-06, "optim/total_tokens": 1998954954752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2563531398773193, "created_at": "2025-06-03T10:40:22.461365+00:00"} {"global_step": 238295, "acc_step": 0, "speed/wps": 5523.522055416031, "speed/FLOPS": 244111402900594.75, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04767072945833206, "optim/lr": 2.504340916709369e-06, "optim/total_tokens": 1998963343360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2536014318466187, "created_at": "2025-06-03T10:40:25.435873+00:00"} {"global_step": 238296, "acc_step": 0, "speed/wps": 5528.846430692343, "speed/FLOPS": 244346713035184.56, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04740092530846596, "optim/lr": 2.500793691614822e-06, "optim/total_tokens": 1998971731968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2536712884902954, "created_at": "2025-06-03T10:40:28.408107+00:00"} {"global_step": 238297, "acc_step": 0, "speed/wps": 5523.416119755373, "speed/FLOPS": 244106721086621.5, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04910173639655113, "optim/lr": 2.4972464665204973e-06, "optim/total_tokens": 1998980120576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.235769271850586, "created_at": "2025-06-03T10:40:31.381752+00:00"} {"global_step": 238298, "acc_step": 0, "speed/wps": 5517.140376074277, "speed/FLOPS": 243829365338085.16, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04772505909204483, "optim/lr": 2.493699241425951e-06, "optim/total_tokens": 1998988509184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2395659685134888, "created_at": "2025-06-03T10:40:34.359518+00:00"} {"global_step": 238299, "acc_step": 0, "speed/wps": 5501.105408514869, "speed/FLOPS": 243120701846363.53, "speed/curr_iter_time": 2.9774, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9774, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 197.09, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04737207666039467, "optim/lr": 2.490152016331404e-06, "optim/total_tokens": 1998996897792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2487118244171143, "created_at": "2025-06-03T10:40:37.341803+00:00"} {"global_step": 238300, "acc_step": 0, "speed/wps": 5529.228995822097, "speed/FLOPS": 244363620455773.8, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.58 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.58, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04735987260937691, "optim/lr": 2.4866047912368573e-06, "optim/total_tokens": 1999005286400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2518874406814575, "created_at": "2025-06-03T10:40:40.309618+00:00"} {"global_step": 238301, "acc_step": 0, "speed/wps": 5543.269347119351, "speed/FLOPS": 244984132118079.75, "speed/curr_iter_time": 2.9546, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9546, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 195.58, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05011989548802376, "optim/lr": 2.4830575661425324e-06, "optim/total_tokens": 1999013675008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.237103819847107, "created_at": "2025-06-03T10:40:43.270770+00:00"} {"global_step": 238302, "acc_step": 0, "speed/wps": 5529.2624528859615, "speed/FLOPS": 244365099086747.84, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047918979078531265, "optim/lr": 2.479510341047986e-06, "optim/total_tokens": 1999022063616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2643376588821411, "created_at": "2025-06-03T10:40:46.242967+00:00"} {"global_step": 238303, "acc_step": 0, "speed/wps": 5523.659208726721, "speed/FLOPS": 244117464374912.94, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04712091386318207, "optim/lr": 2.475963115953439e-06, "optim/total_tokens": 1999030452224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2358605861663818, "created_at": "2025-06-03T10:40:49.213270+00:00"} {"global_step": 238304, "acc_step": 0, "speed/wps": 5543.56521999595, "speed/FLOPS": 244997208184810.8, "speed/curr_iter_time": 2.9545, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9545, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 195.57, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04760218784213066, "optim/lr": 2.4724158908588923e-06, "optim/total_tokens": 1999038840832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2536745071411133, "created_at": "2025-06-03T10:40:52.173234+00:00"} {"global_step": 238305, "acc_step": 0, "speed/wps": 5522.1947433183095, "speed/FLOPS": 244052742499674.62, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047323960810899734, "optim/lr": 2.4688686657645674e-06, "optim/total_tokens": 1999047229440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2520549297332764, "created_at": "2025-06-03T10:40:55.144371+00:00"} {"global_step": 238306, "acc_step": 0, "speed/wps": 5530.831044620717, "speed/FLOPS": 244434422812643.72, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04863927885890007, "optim/lr": 2.465321440670021e-06, "optim/total_tokens": 1999055618048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.241851568222046, "created_at": "2025-06-03T10:40:58.115103+00:00"} {"global_step": 238307, "acc_step": 0, "speed/wps": 5516.292852358466, "speed/FLOPS": 243791909127865.94, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.55, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04766426980495453, "optim/lr": 2.4617742155754742e-06, "optim/total_tokens": 1999064006656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2577039003372192, "created_at": "2025-06-03T10:41:01.090004+00:00"} {"global_step": 238308, "acc_step": 0, "speed/wps": 5511.754401691737, "speed/FLOPS": 243591332838292.88, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.71, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04760764539241791, "optim/lr": 2.4582269904809274e-06, "optim/total_tokens": 1999072395264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2658944129943848, "created_at": "2025-06-03T10:41:04.066826+00:00"} {"global_step": 238309, "acc_step": 0, "speed/wps": 5527.523514496147, "speed/FLOPS": 244288246910611.6, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0476747527718544, "optim/lr": 2.4546797653866025e-06, "optim/total_tokens": 1999080783872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.240902304649353, "created_at": "2025-06-03T10:41:07.034991+00:00"} {"global_step": 238310, "acc_step": 0, "speed/wps": 5526.4157035339385, "speed/FLOPS": 244239287336372.5, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04778975620865822, "optim/lr": 2.4511325402920557e-06, "optim/total_tokens": 1999089172480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2544771432876587, "created_at": "2025-06-03T10:41:10.004499+00:00"} {"global_step": 238311, "acc_step": 0, "speed/wps": 5527.282617704876, "speed/FLOPS": 244277600505459.0, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04817984625697136, "optim/lr": 2.4475853151975093e-06, "optim/total_tokens": 1999097561088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2404528856277466, "created_at": "2025-06-03T10:41:12.973300+00:00"} {"global_step": 238312, "acc_step": 0, "speed/wps": 5524.878659101313, "speed/FLOPS": 244171357839757.06, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04790882766246796, "optim/lr": 2.4440380901029625e-06, "optim/total_tokens": 1999105949696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.255696415901184, "created_at": "2025-06-03T10:41:15.946397+00:00"} {"global_step": 238313, "acc_step": 0, "speed/wps": 5505.825102149899, "speed/FLOPS": 243329288147449.88, "speed/curr_iter_time": 2.9713, "speed/data_load_time": 0.0023, "speed/curr_step_time": 2.9713, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047688182443380356, "optim/lr": 2.4404908650086376e-06, "optim/total_tokens": 1999114338304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2538087368011475, "created_at": "2025-06-03T10:41:18.927797+00:00"} {"global_step": 238314, "acc_step": 0, "speed/wps": 5516.432841832155, "speed/FLOPS": 243798095946071.9, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0011, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.57 hours", "speed/est_time_elapsed_hrs": 196.52, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.57, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047598376870155334, "optim/lr": 2.4369436399140908e-06, "optim/total_tokens": 1999122726912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.25480318069458, "created_at": "2025-06-03T10:41:21.902713+00:00"} {"global_step": 238315, "acc_step": 0, "speed/wps": 5524.510392935051, "speed/FLOPS": 244155082360165.38, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04857780784368515, "optim/lr": 2.4333964148195444e-06, "optim/total_tokens": 1999131115520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2694164514541626, "created_at": "2025-06-03T10:41:24.872762+00:00"} {"global_step": 238316, "acc_step": 0, "speed/wps": 5520.67654641351, "speed/FLOPS": 243985645967318.66, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04699436202645302, "optim/lr": 2.4298491897249976e-06, "optim/total_tokens": 1999139504128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2437766790390015, "created_at": "2025-06-03T10:41:27.850149+00:00"} {"global_step": 238317, "acc_step": 0, "speed/wps": 5533.663348965063, "speed/FLOPS": 244559596167616.0, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04728759452700615, "optim/lr": 2.4263019646306727e-06, "optim/total_tokens": 1999147892736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.252886176109314, "created_at": "2025-06-03T10:41:30.816372+00:00"} {"global_step": 238318, "acc_step": 0, "speed/wps": 5517.1342488417185, "speed/FLOPS": 243829094545768.1, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0543966218829155, "optim/lr": 2.422754739536126e-06, "optim/total_tokens": 1999156281344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2609151601791382, "created_at": "2025-06-03T10:41:33.790356+00:00"} {"global_step": 238319, "acc_step": 0, "speed/wps": 5520.581303122941, "speed/FLOPS": 243981436701374.88, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04797419160604477, "optim/lr": 2.4192075144415795e-06, "optim/total_tokens": 1999164669952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2380295991897583, "created_at": "2025-06-03T10:41:36.763502+00:00"} {"global_step": 238320, "acc_step": 0, "speed/wps": 5534.082524512981, "speed/FLOPS": 244578121581299.0, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 195.84, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04846208542585373, "optim/lr": 2.4156602893472546e-06, "optim/total_tokens": 1999173058560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2428085803985596, "created_at": "2025-06-03T10:41:39.728673+00:00"} {"global_step": 238321, "acc_step": 0, "speed/wps": 5524.586415264793, "speed/FLOPS": 244158442158022.4, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04730299487709999, "optim/lr": 2.4121130642527077e-06, "optim/total_tokens": 1999181447168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2689721584320068, "created_at": "2025-06-03T10:41:42.702455+00:00"} {"global_step": 238322, "acc_step": 0, "speed/wps": 5520.445345474677, "speed/FLOPS": 243975428069215.94, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047028910368680954, "optim/lr": 2.408565839158161e-06, "optim/total_tokens": 1999189835776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.265789270401001, "created_at": "2025-06-03T10:41:45.678315+00:00"} {"global_step": 238323, "acc_step": 0, "speed/wps": 5525.021844083373, "speed/FLOPS": 244177685883076.94, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047161493450403214, "optim/lr": 2.4050186140636145e-06, "optim/total_tokens": 1999198224384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2559641599655151, "created_at": "2025-06-03T10:41:48.654511+00:00"} {"global_step": 238324, "acc_step": 0, "speed/wps": 5510.521756689161, "speed/FLOPS": 243536856238428.06, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.77, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04788578301668167, "optim/lr": 2.4014713889692896e-06, "optim/total_tokens": 1999206612992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2545007467269897, "created_at": "2025-06-03T10:41:51.636385+00:00"} {"global_step": 238325, "acc_step": 0, "speed/wps": 5530.4869385249485, "speed/FLOPS": 244419215084505.4, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04747554659843445, "optim/lr": 2.397924163874743e-06, "optim/total_tokens": 1999215001600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2612359523773193, "created_at": "2025-06-03T10:41:54.607261+00:00"} {"global_step": 238326, "acc_step": 0, "speed/wps": 5524.481523491889, "speed/FLOPS": 244153806478544.8, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.56 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.56, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04726386070251465, "optim/lr": 2.394376938780196e-06, "optim/total_tokens": 1999223390208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2553377151489258, "created_at": "2025-06-03T10:41:57.577683+00:00"} {"global_step": 238327, "acc_step": 0, "speed/wps": 5525.0468791508265, "speed/FLOPS": 244178792304917.28, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.16, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04808172211050987, "optim/lr": 2.390829713685649e-06, "optim/total_tokens": 1999231778816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.255840539932251, "created_at": "2025-06-03T10:42:00.547980+00:00"} {"global_step": 238328, "acc_step": 0, "speed/wps": 5521.052169797357, "speed/FLOPS": 244002246598269.97, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.39, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047566503286361694, "optim/lr": 2.3872824885913247e-06, "optim/total_tokens": 1999240167424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2544708251953125, "created_at": "2025-06-03T10:42:03.519974+00:00"} {"global_step": 238329, "acc_step": 0, "speed/wps": 5528.674425161026, "speed/FLOPS": 244339111271104.44, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04788857698440552, "optim/lr": 2.383735263496778e-06, "optim/total_tokens": 1999248556032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2553836107254028, "created_at": "2025-06-03T10:42:06.488195+00:00"} {"global_step": 238330, "acc_step": 0, "speed/wps": 5521.950845094949, "speed/FLOPS": 244041963446586.34, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047232262790203094, "optim/lr": 2.380188038402231e-06, "optim/total_tokens": 1999256944640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.265548825263977, "created_at": "2025-06-03T10:42:09.460372+00:00"} {"global_step": 238331, "acc_step": 0, "speed/wps": 5523.591451975566, "speed/FLOPS": 244114469873322.38, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04760803282260895, "optim/lr": 2.3766408133076843e-06, "optim/total_tokens": 1999265333248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2570013999938965, "created_at": "2025-06-03T10:42:12.433867+00:00"} {"global_step": 238332, "acc_step": 0, "speed/wps": 5517.009341911345, "speed/FLOPS": 243823574298777.2, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04722961038351059, "optim/lr": 2.3730935882133598e-06, "optim/total_tokens": 1999273721856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2592368125915527, "created_at": "2025-06-03T10:42:15.409413+00:00"} {"global_step": 238333, "acc_step": 0, "speed/wps": 5516.879191124831, "speed/FLOPS": 243817822300185.4, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04822177439928055, "optim/lr": 2.369546363118813e-06, "optim/total_tokens": 1999282110464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.263016939163208, "created_at": "2025-06-03T10:42:18.383889+00:00"} {"global_step": 238334, "acc_step": 0, "speed/wps": 5532.381489412107, "speed/FLOPS": 244502944536527.3, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047662779688835144, "optim/lr": 2.365999138024266e-06, "optim/total_tokens": 1999290499072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2426097393035889, "created_at": "2025-06-03T10:42:21.353848+00:00"} {"global_step": 238335, "acc_step": 0, "speed/wps": 5526.240169840045, "speed/FLOPS": 244231529645565.3, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047373440116643906, "optim/lr": 2.3624519129297193e-06, "optim/total_tokens": 1999298887680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2560831308364868, "created_at": "2025-06-03T10:42:24.323401+00:00"} {"global_step": 238336, "acc_step": 0, "speed/wps": 5522.634262492603, "speed/FLOPS": 244072166997515.3, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04759439080953598, "optim/lr": 2.358904687835395e-06, "optim/total_tokens": 1999307276288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2694780826568604, "created_at": "2025-06-03T10:42:27.295154+00:00"} {"global_step": 238337, "acc_step": 0, "speed/wps": 5520.682595759355, "speed/FLOPS": 243985913317441.66, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04775013029575348, "optim/lr": 2.355357462740848e-06, "optim/total_tokens": 1999315664896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2461531162261963, "created_at": "2025-06-03T10:42:30.270434+00:00"} {"global_step": 238338, "acc_step": 0, "speed/wps": 5528.514199813647, "speed/FLOPS": 244332030130857.97, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04807930067181587, "optim/lr": 2.3518102376463012e-06, "optim/total_tokens": 1999324053504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2610844373703003, "created_at": "2025-06-03T10:42:33.238450+00:00"} {"global_step": 238339, "acc_step": 0, "speed/wps": 5514.006635202129, "speed/FLOPS": 243690870031476.03, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.55 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.55, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047782957553863525, "optim/lr": 2.3482630125517544e-06, "optim/total_tokens": 1999332442112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2477775812149048, "created_at": "2025-06-03T10:42:36.214295+00:00"} {"global_step": 238340, "acc_step": 0, "speed/wps": 5515.149479835993, "speed/FLOPS": 243741377914683.72, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04806045815348625, "optim/lr": 2.34471578745743e-06, "optim/total_tokens": 1999340830720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.233836054801941, "created_at": "2025-06-03T10:42:39.189520+00:00"} {"global_step": 238341, "acc_step": 0, "speed/wps": 5523.21353435575, "speed/FLOPS": 244097767848884.25, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04917389526963234, "optim/lr": 2.341168562362883e-06, "optim/total_tokens": 1999349219328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2591865062713623, "created_at": "2025-06-03T10:42:42.162895+00:00"} {"global_step": 238342, "acc_step": 0, "speed/wps": 5532.509443551388, "speed/FLOPS": 244508599454554.88, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04793722555041313, "optim/lr": 2.3376213372683363e-06, "optim/total_tokens": 1999357607936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2551803588867188, "created_at": "2025-06-03T10:42:45.129385+00:00"} {"global_step": 238343, "acc_step": 0, "speed/wps": 5521.775976207979, "speed/FLOPS": 244034235136842.38, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04911721870303154, "optim/lr": 2.3340741121737895e-06, "optim/total_tokens": 1999365996544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.248999834060669, "created_at": "2025-06-03T10:42:48.105110+00:00"} {"global_step": 238344, "acc_step": 0, "speed/wps": 5521.753694839138, "speed/FLOPS": 244033250414386.0, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05049881711602211, "optim/lr": 2.330526887079465e-06, "optim/total_tokens": 1999374385152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2624098062515259, "created_at": "2025-06-03T10:42:51.079724+00:00"} {"global_step": 238345, "acc_step": 0, "speed/wps": 5511.160553286094, "speed/FLOPS": 243565087778355.12, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.76, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04821361228823662, "optim/lr": 2.326979661984918e-06, "optim/total_tokens": 1999382773760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.247493028640747, "created_at": "2025-06-03T10:42:54.058916+00:00"} {"global_step": 238346, "acc_step": 0, "speed/wps": 5527.266734670264, "speed/FLOPS": 244276898556625.84, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04768063500523567, "optim/lr": 2.3234324368903714e-06, "optim/total_tokens": 1999391162368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.260411262512207, "created_at": "2025-06-03T10:42:57.030429+00:00"} {"global_step": 238347, "acc_step": 0, "speed/wps": 5511.078449557072, "speed/FLOPS": 243561459213777.38, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047737766057252884, "optim/lr": 2.319885211796047e-06, "optim/total_tokens": 1999399550976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2433359622955322, "created_at": "2025-06-03T10:43:00.011252+00:00"} {"global_step": 238348, "acc_step": 0, "speed/wps": 5505.4698741492875, "speed/FLOPS": 243313588888044.6, "speed/curr_iter_time": 2.975, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.975, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.97, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04721163213253021, "optim/lr": 2.3163379867015e-06, "optim/total_tokens": 1999407939584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.244315266609192, "created_at": "2025-06-03T10:43:02.992040+00:00"} {"global_step": 238349, "acc_step": 0, "speed/wps": 5509.830520152834, "speed/FLOPS": 243506307121591.75, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04745153337717056, "optim/lr": 2.3127907616069533e-06, "optim/total_tokens": 1999416328192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2622085809707642, "created_at": "2025-06-03T10:43:05.970923+00:00"} {"global_step": 238350, "acc_step": 0, "speed/wps": 5523.375955428785, "speed/FLOPS": 244104946028966.0, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.54 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.54, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04863698408007622, "optim/lr": 2.3092435365124065e-06, "optim/total_tokens": 1999424716800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2701948881149292, "created_at": "2025-06-03T10:43:08.942435+00:00"} {"global_step": 238351, "acc_step": 0, "speed/wps": 5528.684668984519, "speed/FLOPS": 244339563995670.2, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0477074533700943, "optim/lr": 2.305696311418082e-06, "optim/total_tokens": 1999433105408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2473092079162598, "created_at": "2025-06-03T10:43:11.916873+00:00"} {"global_step": 238352, "acc_step": 0, "speed/wps": 5514.2527181975565, "speed/FLOPS": 243701745640307.0, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04723319783806801, "optim/lr": 2.302149086323535e-06, "optim/total_tokens": 1999441494016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2276910543441772, "created_at": "2025-06-03T10:43:14.893436+00:00"} {"global_step": 238353, "acc_step": 0, "speed/wps": 5531.061157346883, "speed/FLOPS": 244444592617316.56, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04743952304124832, "optim/lr": 2.2986018612289883e-06, "optim/total_tokens": 1999449882624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.238002061843872, "created_at": "2025-06-03T10:43:17.860632+00:00"} {"global_step": 238354, "acc_step": 0, "speed/wps": 5524.174540568302, "speed/FLOPS": 244140239404603.34, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04709101468324661, "optim/lr": 2.2950546361344415e-06, "optim/total_tokens": 1999458271232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2528800964355469, "created_at": "2025-06-03T10:43:20.833647+00:00"} {"global_step": 238355, "acc_step": 0, "speed/wps": 5515.720263782174, "speed/FLOPS": 243766603643567.84, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.6, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048345889896154404, "optim/lr": 2.2915074110401166e-06, "optim/total_tokens": 1999466659840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2382631301879883, "created_at": "2025-06-03T10:43:23.811115+00:00"} {"global_step": 238356, "acc_step": 0, "speed/wps": 5524.133971882104, "speed/FLOPS": 244138446476322.72, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04805012419819832, "optim/lr": 2.2879601859455702e-06, "optim/total_tokens": 1999475048448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2474027872085571, "created_at": "2025-06-03T10:43:26.782036+00:00"} {"global_step": 238357, "acc_step": 0, "speed/wps": 5514.3466404643095, "speed/FLOPS": 243705896523759.75, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04730459302663803, "optim/lr": 2.2844129608510234e-06, "optim/total_tokens": 1999483437056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2631412744522095, "created_at": "2025-06-03T10:43:29.758338+00:00"} {"global_step": 238358, "acc_step": 0, "speed/wps": 5522.170020102905, "speed/FLOPS": 244051649860098.62, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04765436053276062, "optim/lr": 2.2808657357564766e-06, "optim/total_tokens": 1999491825664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2527066469192505, "created_at": "2025-06-03T10:43:32.733113+00:00"} {"global_step": 238359, "acc_step": 0, "speed/wps": 5528.045455976539, "speed/FLOPS": 244311314052506.25, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04838084056973457, "optim/lr": 2.2773185106621517e-06, "optim/total_tokens": 1999500214272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2488744258880615, "created_at": "2025-06-03T10:43:35.701973+00:00"} {"global_step": 238360, "acc_step": 0, "speed/wps": 5519.859196719911, "speed/FLOPS": 243949523294436.6, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047905467450618744, "optim/lr": 2.2737712855676053e-06, "optim/total_tokens": 1999508602880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2522809505462646, "created_at": "2025-06-03T10:43:38.676005+00:00"} {"global_step": 238361, "acc_step": 0, "speed/wps": 5521.833657122268, "speed/FLOPS": 244036784338016.28, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04727065935730934, "optim/lr": 2.2702240604730585e-06, "optim/total_tokens": 1999516991488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2491421699523926, "created_at": "2025-06-03T10:43:41.652065+00:00"} {"global_step": 238362, "acc_step": 0, "speed/wps": 5524.019237137029, "speed/FLOPS": 244133375787856.1, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.53 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.53, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04779605567455292, "optim/lr": 2.2666768353785117e-06, "optim/total_tokens": 1999525380096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2526373863220215, "created_at": "2025-06-03T10:43:44.624515+00:00"} {"global_step": 238363, "acc_step": 0, "speed/wps": 5524.923911001797, "speed/FLOPS": 244173357742138.22, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047392696142196655, "optim/lr": 2.2631296102841868e-06, "optim/total_tokens": 1999533768704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2617782354354858, "created_at": "2025-06-03T10:43:47.594222+00:00"} {"global_step": 238364, "acc_step": 0, "speed/wps": 5514.475876206544, "speed/FLOPS": 243711608082078.0, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047026123851537704, "optim/lr": 2.2595823851896404e-06, "optim/total_tokens": 1999542157312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2305363416671753, "created_at": "2025-06-03T10:43:50.570248+00:00"} {"global_step": 238365, "acc_step": 0, "speed/wps": 5525.613068190997, "speed/FLOPS": 244203814962474.62, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04755476489663124, "optim/lr": 2.2560351600950936e-06, "optim/total_tokens": 1999550545920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.258292317390442, "created_at": "2025-06-03T10:43:53.541307+00:00"} {"global_step": 238366, "acc_step": 0, "speed/wps": 5521.33894515113, "speed/FLOPS": 244014920601057.4, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04823741689324379, "optim/lr": 2.2524879350005468e-06, "optim/total_tokens": 1999558934528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2613366842269897, "created_at": "2025-06-03T10:43:56.517303+00:00"} {"global_step": 238367, "acc_step": 0, "speed/wps": 5517.14267081613, "speed/FLOPS": 243829466753929.5, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04783264920115471, "optim/lr": 2.248940709906222e-06, "optim/total_tokens": 1999567323136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.244894027709961, "created_at": "2025-06-03T10:43:59.493433+00:00"} {"global_step": 238368, "acc_step": 0, "speed/wps": 5529.398930776032, "speed/FLOPS": 244371130710931.8, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048142120242118835, "optim/lr": 2.2453934848116755e-06, "optim/total_tokens": 1999575711744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2515887022018433, "created_at": "2025-06-03T10:44:02.461027+00:00"} {"global_step": 238369, "acc_step": 0, "speed/wps": 5521.719853707679, "speed/FLOPS": 244031754809590.12, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04749041050672531, "optim/lr": 2.2418462597171286e-06, "optim/total_tokens": 1999584100352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2606360912322998, "created_at": "2025-06-03T10:44:05.437437+00:00"} {"global_step": 238370, "acc_step": 0, "speed/wps": 5517.698324883412, "speed/FLOPS": 243854023819608.03, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04726884141564369, "optim/lr": 2.238299034622582e-06, "optim/total_tokens": 1999592488960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2686465978622437, "created_at": "2025-06-03T10:44:08.411211+00:00"} {"global_step": 238371, "acc_step": 0, "speed/wps": 5527.687731932802, "speed/FLOPS": 244295504480770.72, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048410478979349136, "optim/lr": 2.234751809528257e-06, "optim/total_tokens": 1999600877568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.252408504486084, "created_at": "2025-06-03T10:44:11.379431+00:00"} {"global_step": 238372, "acc_step": 0, "speed/wps": 5528.371167324213, "speed/FLOPS": 244325708826931.62, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04857053607702255, "optim/lr": 2.23120458443371e-06, "optim/total_tokens": 1999609266176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2617439031600952, "created_at": "2025-06-03T10:44:14.351218+00:00"} {"global_step": 238373, "acc_step": 0, "speed/wps": 5510.525233917251, "speed/FLOPS": 243537009914111.6, "speed/curr_iter_time": 2.9723, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9723, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04780808091163635, "optim/lr": 2.2276573593391637e-06, "optim/total_tokens": 1999617654784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2475636005401611, "created_at": "2025-06-03T10:44:17.331964+00:00"} {"global_step": 238374, "acc_step": 0, "speed/wps": 5514.669342281203, "speed/FLOPS": 243720158292328.8, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.52 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.52, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05506699159741402, "optim/lr": 2.224110134244839e-06, "optim/total_tokens": 1999626043392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2477277517318726, "created_at": "2025-06-03T10:44:20.307848+00:00"} {"global_step": 238375, "acc_step": 0, "speed/wps": 5525.270762890828, "speed/FLOPS": 244188686820284.5, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04764263331890106, "optim/lr": 2.220562909150292e-06, "optim/total_tokens": 1999634432000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.259414792060852, "created_at": "2025-06-03T10:44:23.277209+00:00"} {"global_step": 238376, "acc_step": 0, "speed/wps": 5521.972083753797, "speed/FLOPS": 244042902086598.12, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048533037304878235, "optim/lr": 2.217015684055745e-06, "optim/total_tokens": 1999642820608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2582252025604248, "created_at": "2025-06-03T10:44:26.249161+00:00"} {"global_step": 238377, "acc_step": 0, "speed/wps": 5524.234776944657, "speed/FLOPS": 244142901544120.5, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04824144020676613, "optim/lr": 2.213468458961199e-06, "optim/total_tokens": 1999651209216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.251582145690918, "created_at": "2025-06-03T10:44:29.219361+00:00"} {"global_step": 238378, "acc_step": 0, "speed/wps": 5527.958613915597, "speed/FLOPS": 244307476077910.6, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04722132161259651, "optim/lr": 2.209921233866874e-06, "optim/total_tokens": 1999659597824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2581263780593872, "created_at": "2025-06-03T10:44:32.188773+00:00"} {"global_step": 238379, "acc_step": 0, "speed/wps": 5525.8790191639755, "speed/FLOPS": 244215568634219.78, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047839391976594925, "optim/lr": 2.206374008772327e-06, "optim/total_tokens": 1999667986432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2454649209976196, "created_at": "2025-06-03T10:44:35.160608+00:00"} {"global_step": 238380, "acc_step": 0, "speed/wps": 5522.573381421457, "speed/FLOPS": 244069476365788.25, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04759162664413452, "optim/lr": 2.2028267836777803e-06, "optim/total_tokens": 1999676375040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2683444023132324, "created_at": "2025-06-03T10:44:38.131809+00:00"} {"global_step": 238381, "acc_step": 0, "speed/wps": 5516.811991163549, "speed/FLOPS": 243814852405857.3, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047369178384542465, "optim/lr": 2.199279558583234e-06, "optim/total_tokens": 1999684763648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2661254405975342, "created_at": "2025-06-03T10:44:41.105886+00:00"} {"global_step": 238382, "acc_step": 0, "speed/wps": 5538.477889009125, "speed/FLOPS": 244772374194513.62, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04722091183066368, "optim/lr": 2.195732333488909e-06, "optim/total_tokens": 1999693152256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2354161739349365, "created_at": "2025-06-03T10:44:44.072997+00:00"} {"global_step": 238383, "acc_step": 0, "speed/wps": 5510.655364717198, "speed/FLOPS": 243542761029399.44, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049006387591362, "optim/lr": 2.192185108394362e-06, "optim/total_tokens": 1999701540864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.243100881576538, "created_at": "2025-06-03T10:44:47.054960+00:00"} {"global_step": 238384, "acc_step": 0, "speed/wps": 5518.383753489925, "speed/FLOPS": 243884316255674.25, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04727708175778389, "optim/lr": 2.1886378832998153e-06, "optim/total_tokens": 1999709929472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2513487339019775, "created_at": "2025-06-03T10:44:50.031811+00:00"} {"global_step": 238385, "acc_step": 0, "speed/wps": 5529.46003368859, "speed/FLOPS": 244373831146913.78, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04767364263534546, "optim/lr": 2.185090658205269e-06, "optim/total_tokens": 1999718318080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2677332162857056, "created_at": "2025-06-03T10:44:52.999479+00:00"} {"global_step": 238386, "acc_step": 0, "speed/wps": 5531.328329563188, "speed/FLOPS": 244456400261765.88, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.51 hours", "speed/est_time_elapsed_hrs": 196.08, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.51, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04772765934467316, "optim/lr": 2.181543433110944e-06, "optim/total_tokens": 1999726706688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2539860010147095, "created_at": "2025-06-03T10:44:55.965901+00:00"} {"global_step": 238387, "acc_step": 0, "speed/wps": 5524.009684470971, "speed/FLOPS": 244132953608911.28, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048081815242767334, "optim/lr": 2.1779962080163972e-06, "optim/total_tokens": 1999735095296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2498868703842163, "created_at": "2025-06-03T10:44:58.940298+00:00"} {"global_step": 238388, "acc_step": 0, "speed/wps": 5526.9599830338575, "speed/FLOPS": 244263341704393.9, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04810439050197601, "optim/lr": 2.1744489829218504e-06, "optim/total_tokens": 1999743483904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2600313425064087, "created_at": "2025-06-03T10:45:01.908881+00:00"} {"global_step": 238389, "acc_step": 0, "speed/wps": 5518.766185621659, "speed/FLOPS": 243901217798431.8, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04714405909180641, "optim/lr": 2.1709017578273036e-06, "optim/total_tokens": 1999751872512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2578206062316895, "created_at": "2025-06-03T10:45:04.886637+00:00"} {"global_step": 238390, "acc_step": 0, "speed/wps": 5518.784442330814, "speed/FLOPS": 243902024651530.16, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04769185930490494, "optim/lr": 2.167354532732979e-06, "optim/total_tokens": 1999760261120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.263368010520935, "created_at": "2025-06-03T10:45:07.862463+00:00"} {"global_step": 238391, "acc_step": 0, "speed/wps": 5523.32550784709, "speed/FLOPS": 244102716504069.2, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049368634819984436, "optim/lr": 2.1638073076384323e-06, "optim/total_tokens": 1999768649728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2691575288772583, "created_at": "2025-06-03T10:45:10.833518+00:00"} {"global_step": 238392, "acc_step": 0, "speed/wps": 5514.483561901734, "speed/FLOPS": 243711947750466.47, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.68, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04940236359834671, "optim/lr": 2.1602600825438855e-06, "optim/total_tokens": 1999777038336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2445881366729736, "created_at": "2025-06-03T10:45:13.809090+00:00"} {"global_step": 238393, "acc_step": 0, "speed/wps": 5525.986873212447, "speed/FLOPS": 244220335231115.16, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04781528189778328, "optim/lr": 2.1567128574493387e-06, "optim/total_tokens": 1999785426944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2499288320541382, "created_at": "2025-06-03T10:45:16.778355+00:00"} {"global_step": 238394, "acc_step": 0, "speed/wps": 5532.14896739833, "speed/FLOPS": 244492668253673.9, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04759414121508598, "optim/lr": 2.153165632355014e-06, "optim/total_tokens": 1999793815552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.259852647781372, "created_at": "2025-06-03T10:45:19.747203+00:00"} {"global_step": 238395, "acc_step": 0, "speed/wps": 5522.416664141471, "speed/FLOPS": 244062550264164.62, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049532391130924225, "optim/lr": 2.1496184072604674e-06, "optim/total_tokens": 1999802204160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2401196956634521, "created_at": "2025-06-03T10:45:22.718960+00:00"} {"global_step": 238396, "acc_step": 0, "speed/wps": 5517.5960861006715, "speed/FLOPS": 243849505388716.44, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04915624484419823, "optim/lr": 2.1460711821659206e-06, "optim/total_tokens": 1999810592768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2558673620224, "created_at": "2025-06-03T10:45:25.692757+00:00"} {"global_step": 238397, "acc_step": 0, "speed/wps": 5517.984203698454, "speed/FLOPS": 243866658199972.47, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05005302280187607, "optim/lr": 2.1425239570713738e-06, "optim/total_tokens": 1999818981376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2605408430099487, "created_at": "2025-06-03T10:45:28.665983+00:00"} {"global_step": 238398, "acc_step": 0, "speed/wps": 5522.121600493064, "speed/FLOPS": 244049509961177.7, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04745462164282799, "optim/lr": 2.1389767319770493e-06, "optim/total_tokens": 1999827369984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2420395612716675, "created_at": "2025-06-03T10:45:31.637867+00:00"} {"global_step": 238399, "acc_step": 0, "speed/wps": 5514.340547955634, "speed/FLOPS": 243705627266060.56, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.5 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.5, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04808855801820755, "optim/lr": 2.1354295068825025e-06, "optim/total_tokens": 1999835758592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.263999342918396, "created_at": "2025-06-03T10:45:34.613607+00:00"} {"global_step": 238400, "acc_step": 0, "speed/wps": 5517.096265926834, "speed/FLOPS": 243827415895344.4, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04893915355205536, "optim/lr": 2.1318822817879556e-06, "optim/total_tokens": 1999844147200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.266847848892212, "created_at": "2025-06-03T10:45:37.587826+00:00"} {"global_step": 238401, "acc_step": 0, "speed/wps": 5523.695440602926, "speed/FLOPS": 244119065638389.66, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04757893830537796, "optim/lr": 2.128335056693631e-06, "optim/total_tokens": 1999852535808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2596478462219238, "created_at": "2025-06-03T10:45:40.558047+00:00"} {"global_step": 238402, "acc_step": 0, "speed/wps": 5521.723903148273, "speed/FLOPS": 244031933774137.47, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04777684807777405, "optim/lr": 2.1247878315990844e-06, "optim/total_tokens": 1999860924416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2375937700271606, "created_at": "2025-06-03T10:45:43.532245+00:00"} {"global_step": 238403, "acc_step": 0, "speed/wps": 5529.596387066817, "speed/FLOPS": 244379857268311.6, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049396682530641556, "optim/lr": 2.1212406065045375e-06, "optim/total_tokens": 1999869313024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.249116063117981, "created_at": "2025-06-03T10:45:46.501436+00:00"} {"global_step": 238404, "acc_step": 0, "speed/wps": 5520.3966646467225, "speed/FLOPS": 243973276625791.4, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.39, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04767788574099541, "optim/lr": 2.1176933814099907e-06, "optim/total_tokens": 1999877701632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2405941486358643, "created_at": "2025-06-03T10:45:49.473485+00:00"} {"global_step": 238405, "acc_step": 0, "speed/wps": 5525.496835442805, "speed/FLOPS": 244198678069937.62, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0501825325191021, "optim/lr": 2.1141461563156663e-06, "optim/total_tokens": 1999886090240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2449549436569214, "created_at": "2025-06-03T10:45:52.444168+00:00"} {"global_step": 238406, "acc_step": 0, "speed/wps": 5528.056626818451, "speed/FLOPS": 244311807746541.22, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04836674779653549, "optim/lr": 2.1105989312211194e-06, "optim/total_tokens": 1999894478848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2569196224212646, "created_at": "2025-06-03T10:45:55.413446+00:00"} {"global_step": 238407, "acc_step": 0, "speed/wps": 5517.059509379163, "speed/FLOPS": 243825791444074.38, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04776359349489212, "optim/lr": 2.1070517061265726e-06, "optim/total_tokens": 1999902867456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2462238073349, "created_at": "2025-06-03T10:45:58.388298+00:00"} {"global_step": 238408, "acc_step": 0, "speed/wps": 5517.19467177874, "speed/FLOPS": 243831764930311.8, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04881763458251953, "optim/lr": 2.103504481032026e-06, "optim/total_tokens": 1999911256064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2500096559524536, "created_at": "2025-06-03T10:46:01.365956+00:00"} {"global_step": 238409, "acc_step": 0, "speed/wps": 5515.997454295329, "speed/FLOPS": 243778854045459.62, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.64, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047446489334106445, "optim/lr": 2.0999572559377013e-06, "optim/total_tokens": 1999919644672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.267390251159668, "created_at": "2025-06-03T10:46:04.344230+00:00"} {"global_step": 238410, "acc_step": 0, "speed/wps": 5527.013936926644, "speed/FLOPS": 244265726190294.03, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04728158563375473, "optim/lr": 2.0964100308431545e-06, "optim/total_tokens": 1999928033280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.248591423034668, "created_at": "2025-06-03T10:46:07.315032+00:00"} {"global_step": 238411, "acc_step": 0, "speed/wps": 5522.016463865817, "speed/FLOPS": 244044863460391.4, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.49 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.49, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0501951240003109, "optim/lr": 2.0928628057486077e-06, "optim/total_tokens": 1999936421888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.258603811264038, "created_at": "2025-06-03T10:46:10.289841+00:00"} {"global_step": 238412, "acc_step": 0, "speed/wps": 5521.511056897357, "speed/FLOPS": 244022527059292.84, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04872014373540878, "optim/lr": 2.089315580654061e-06, "optim/total_tokens": 1999944810496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.243099331855774, "created_at": "2025-06-03T10:46:13.261717+00:00"} {"global_step": 238413, "acc_step": 0, "speed/wps": 5516.939720068084, "speed/FLOPS": 243820497369661.97, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.6, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04781362786889076, "optim/lr": 2.0857683555597364e-06, "optim/total_tokens": 1999953199104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2574236392974854, "created_at": "2025-06-03T10:46:16.239293+00:00"} {"global_step": 238414, "acc_step": 0, "speed/wps": 5517.511480319303, "speed/FLOPS": 243845766246231.6, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047483015805482864, "optim/lr": 2.0822211304651896e-06, "optim/total_tokens": 1999961587712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.255934476852417, "created_at": "2025-06-03T10:46:19.213477+00:00"} {"global_step": 238415, "acc_step": 0, "speed/wps": 5516.678238398901, "speed/FLOPS": 243808941218268.6, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04808349907398224, "optim/lr": 2.0786739053706428e-06, "optim/total_tokens": 1999969976320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2551006078720093, "created_at": "2025-06-03T10:46:22.192745+00:00"} {"global_step": 238416, "acc_step": 0, "speed/wps": 5514.201777744509, "speed/FLOPS": 243699494333019.2, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.71, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04820564389228821, "optim/lr": 2.075126680276096e-06, "optim/total_tokens": 1999978364928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2527087926864624, "created_at": "2025-06-03T10:46:25.168507+00:00"} {"global_step": 238417, "acc_step": 0, "speed/wps": 5530.841365556938, "speed/FLOPS": 244434878945197.38, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04792504757642746, "optim/lr": 2.0715794551817715e-06, "optim/total_tokens": 1999986753536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2302210330963135, "created_at": "2025-06-03T10:46:28.135385+00:00"} {"global_step": 238418, "acc_step": 0, "speed/wps": 5525.923200866561, "speed/FLOPS": 244217521239331.6, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04854729399085045, "optim/lr": 2.0680322300872247e-06, "optim/total_tokens": 1999995142144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2741291522979736, "created_at": "2025-06-03T10:46:31.104275+00:00"} {"global_step": 238419, "acc_step": 0, "speed/wps": 5533.93966550459, "speed/FLOPS": 244571807944346.84, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04794004186987877, "optim/lr": 2.064485004992678e-06, "optim/total_tokens": 2000003530752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2603094577789307, "created_at": "2025-06-03T10:46:34.069210+00:00"} {"global_step": 238420, "acc_step": 0, "speed/wps": 5535.696125315904, "speed/FLOPS": 244649434477630.6, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 195.95, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04741361364722252, "optim/lr": 2.060937779898131e-06, "optim/total_tokens": 2000011919360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2593326568603516, "created_at": "2025-06-03T10:46:37.033485+00:00"} {"global_step": 238421, "acc_step": 0, "speed/wps": 5513.504522800678, "speed/FLOPS": 243668679233376.2, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047605812549591064, "optim/lr": 2.057390554803806e-06, "optim/total_tokens": 2000020307968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2697219848632812, "created_at": "2025-06-03T10:46:40.010712+00:00"} {"global_step": 238422, "acc_step": 0, "speed/wps": 5530.08204320211, "speed/FLOPS": 244401320783678.1, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04757886379957199, "optim/lr": 2.0538433297092597e-06, "optim/total_tokens": 2000028696576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2463666200637817, "created_at": "2025-06-03T10:46:42.982449+00:00"} {"global_step": 238423, "acc_step": 0, "speed/wps": 5528.761255831717, "speed/FLOPS": 244342948742309.3, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.2, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047254983335733414, "optim/lr": 2.050296104614713e-06, "optim/total_tokens": 2000037085184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2571393251419067, "created_at": "2025-06-03T10:46:45.953898+00:00"} {"global_step": 238424, "acc_step": 0, "speed/wps": 5525.291716031659, "speed/FLOPS": 244189612841861.34, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04808320477604866, "optim/lr": 2.046748879520166e-06, "optim/total_tokens": 2000045473792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2414791584014893, "created_at": "2025-06-03T10:46:48.923944+00:00"} {"global_step": 238425, "acc_step": 0, "speed/wps": 5506.918146119156, "speed/FLOPS": 243377595096184.8, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.48 hours", "speed/est_time_elapsed_hrs": 196.98, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.48, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048862144351005554, "optim/lr": 2.043201654425841e-06, "optim/total_tokens": 2000053862400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2522046566009521, "created_at": "2025-06-03T10:46:51.905226+00:00"} {"global_step": 238426, "acc_step": 0, "speed/wps": 5532.47252266521, "speed/FLOPS": 244506967740364.03, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.07, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047734908759593964, "optim/lr": 2.039654429331295e-06, "optim/total_tokens": 2000062251008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2325670719146729, "created_at": "2025-06-03T10:46:54.871497+00:00"} {"global_step": 238427, "acc_step": 0, "speed/wps": 5528.394371221785, "speed/FLOPS": 244326734320436.0, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04715777188539505, "optim/lr": 2.036107204236748e-06, "optim/total_tokens": 2000070639616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2514662742614746, "created_at": "2025-06-03T10:46:57.840839+00:00"} {"global_step": 238428, "acc_step": 0, "speed/wps": 5531.553871044303, "speed/FLOPS": 244466368040805.22, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04819914698600769, "optim/lr": 2.032559979142423e-06, "optim/total_tokens": 2000079028224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2477219104766846, "created_at": "2025-06-03T10:47:00.806886+00:00"} {"global_step": 238429, "acc_step": 0, "speed/wps": 5513.71487981002, "speed/FLOPS": 243677975936484.3, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047430235892534256, "optim/lr": 2.0290127540478763e-06, "optim/total_tokens": 2000087416832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2530345916748047, "created_at": "2025-06-03T10:47:03.787901+00:00"} {"global_step": 238430, "acc_step": 0, "speed/wps": 5524.289316459578, "speed/FLOPS": 244145311911521.47, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04776959866285324, "optim/lr": 2.02546552895333e-06, "optim/total_tokens": 2000095805440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2489572763442993, "created_at": "2025-06-03T10:47:06.758642+00:00"} {"global_step": 238431, "acc_step": 0, "speed/wps": 5511.30535337748, "speed/FLOPS": 243571487201240.34, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047220971435308456, "optim/lr": 2.021918303858783e-06, "optim/total_tokens": 2000104194048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2486401796340942, "created_at": "2025-06-03T10:47:09.739533+00:00"} {"global_step": 238432, "acc_step": 0, "speed/wps": 5514.968725820641, "speed/FLOPS": 243733389512388.1, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04738015681505203, "optim/lr": 2.018371078764458e-06, "optim/total_tokens": 2000112582656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2402558326721191, "created_at": "2025-06-03T10:47:12.717477+00:00"} {"global_step": 238433, "acc_step": 0, "speed/wps": 5510.198363885475, "speed/FLOPS": 243522563931779.6, "speed/curr_iter_time": 2.9724, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9724, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04805157333612442, "optim/lr": 2.0148238536699114e-06, "optim/total_tokens": 2000120971264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2593141794204712, "created_at": "2025-06-03T10:47:15.699984+00:00"} {"global_step": 238434, "acc_step": 0, "speed/wps": 5516.933279264823, "speed/FLOPS": 243820212719124.84, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04932958260178566, "optim/lr": 2.011276628575365e-06, "optim/total_tokens": 2000129359872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2499749660491943, "created_at": "2025-06-03T10:47:18.673724+00:00"} {"global_step": 238435, "acc_step": 0, "speed/wps": 5521.425041273459, "speed/FLOPS": 244018725608984.44, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.47 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.47, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04952271282672882, "optim/lr": 2.007729403480818e-06, "optim/total_tokens": 2000137748480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2469006776809692, "created_at": "2025-06-03T10:47:21.645117+00:00"} {"global_step": 238436, "acc_step": 0, "speed/wps": 5535.050841849597, "speed/FLOPS": 244620916251280.03, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048447828739881516, "optim/lr": 2.0041821783864932e-06, "optim/total_tokens": 2000146137088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2410995960235596, "created_at": "2025-06-03T10:47:24.611712+00:00"} {"global_step": 238437, "acc_step": 0, "speed/wps": 5518.146962539928, "speed/FLOPS": 243873851307690.34, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04741731658577919, "optim/lr": 2.0006349532919464e-06, "optim/total_tokens": 2000154525696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2569290399551392, "created_at": "2025-06-03T10:47:27.586511+00:00"} {"global_step": 238438, "acc_step": 0, "speed/wps": 5514.166542706573, "speed/FLOPS": 243697937124691.66, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05218508467078209, "optim/lr": 1.9970877281973996e-06, "optim/total_tokens": 2000162914304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2551006078720093, "created_at": "2025-06-03T10:47:30.562113+00:00"} {"global_step": 238439, "acc_step": 0, "speed/wps": 5520.350776215878, "speed/FLOPS": 243971248592026.38, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05204065144062042, "optim/lr": 1.9935405031028532e-06, "optim/total_tokens": 2000171302912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2425634860992432, "created_at": "2025-06-03T10:47:33.538439+00:00"} {"global_step": 238440, "acc_step": 0, "speed/wps": 5518.781337716549, "speed/FLOPS": 243901887443470.5, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04826291278004646, "optim/lr": 1.9899932780085283e-06, "optim/total_tokens": 2000179691520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2745296955108643, "created_at": "2025-06-03T10:47:36.511689+00:00"} {"global_step": 238441, "acc_step": 0, "speed/wps": 5518.839692324035, "speed/FLOPS": 243904466418435.44, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04809155315160751, "optim/lr": 1.9864460529139815e-06, "optim/total_tokens": 2000188080128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2487754821777344, "created_at": "2025-06-03T10:47:39.484457+00:00"} {"global_step": 238442, "acc_step": 0, "speed/wps": 5531.01207391714, "speed/FLOPS": 244442423380953.66, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048176176846027374, "optim/lr": 1.9828988278194347e-06, "optim/total_tokens": 2000196468736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.253224492073059, "created_at": "2025-06-03T10:47:42.451097+00:00"} {"global_step": 238443, "acc_step": 0, "speed/wps": 5527.81026905662, "speed/FLOPS": 244300919994441.62, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04758748039603233, "optim/lr": 1.9793516027248883e-06, "optim/total_tokens": 2000204857344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2536734342575073, "created_at": "2025-06-03T10:47:45.423662+00:00"} {"global_step": 238444, "acc_step": 0, "speed/wps": 5521.158722634416, "speed/FLOPS": 244006955688281.12, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04730384796857834, "optim/lr": 1.9758043776305634e-06, "optim/total_tokens": 2000213245952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2634036540985107, "created_at": "2025-06-03T10:47:48.395320+00:00"} {"global_step": 238445, "acc_step": 0, "speed/wps": 5526.469724057375, "speed/FLOPS": 244241674767006.3, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047454241663217545, "optim/lr": 1.9722571525360166e-06, "optim/total_tokens": 2000221634560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.251551628112793, "created_at": "2025-06-03T10:47:51.364037+00:00"} {"global_step": 238446, "acc_step": 0, "speed/wps": 5531.526996816585, "speed/FLOPS": 244465180337494.8, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.46 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.46, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04882017895579338, "optim/lr": 1.9687099274414698e-06, "optim/total_tokens": 2000230023168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2509002685546875, "created_at": "2025-06-03T10:47:54.330190+00:00"} {"global_step": 238447, "acc_step": 0, "speed/wps": 5533.707234865672, "speed/FLOPS": 244561535699794.5, "speed/curr_iter_time": 2.9597, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9597, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047023575752973557, "optim/lr": 1.9651627023469234e-06, "optim/total_tokens": 2000238411776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.240106225013733, "created_at": "2025-06-03T10:47:57.295333+00:00"} {"global_step": 238448, "acc_step": 0, "speed/wps": 5530.594918625212, "speed/FLOPS": 244423987252244.8, "speed/curr_iter_time": 2.96, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.96, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04790681228041649, "optim/lr": 1.9616154772525985e-06, "optim/total_tokens": 2000246800384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2566190958023071, "created_at": "2025-06-03T10:48:00.262707+00:00"} {"global_step": 238449, "acc_step": 0, "speed/wps": 5522.3750811505115, "speed/FLOPS": 244060712508805.25, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0472712367773056, "optim/lr": 1.9580682521580517e-06, "optim/total_tokens": 2000255188992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2756540775299072, "created_at": "2025-06-03T10:48:03.235480+00:00"} {"global_step": 238450, "acc_step": 0, "speed/wps": 5525.122834255528, "speed/FLOPS": 244182149131771.62, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.34, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047703634947538376, "optim/lr": 1.954521027063505e-06, "optim/total_tokens": 2000263577600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2542389631271362, "created_at": "2025-06-03T10:48:06.205249+00:00"} {"global_step": 238451, "acc_step": 0, "speed/wps": 5505.209097413818, "speed/FLOPS": 243302063891113.2, "speed/curr_iter_time": 2.9737, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9737, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.97, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047292403876781464, "optim/lr": 1.9509738019689584e-06, "optim/total_tokens": 2000271966208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.26570725440979, "created_at": "2025-06-03T10:48:09.185987+00:00"} {"global_step": 238452, "acc_step": 0, "speed/wps": 5535.5970152610025, "speed/FLOPS": 244645054320495.2, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048345040529966354, "optim/lr": 1.9474265768746336e-06, "optim/total_tokens": 2000280354816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.246289610862732, "created_at": "2025-06-03T10:48:12.150512+00:00"} {"global_step": 238453, "acc_step": 0, "speed/wps": 5518.672195843414, "speed/FLOPS": 243897063931316.66, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04739750176668167, "optim/lr": 1.9438793517800867e-06, "optim/total_tokens": 2000288743424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2584301233291626, "created_at": "2025-06-03T10:48:15.123723+00:00"} {"global_step": 238454, "acc_step": 0, "speed/wps": 5525.194095715248, "speed/FLOPS": 244185298523542.03, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04739603027701378, "optim/lr": 1.94033212668554e-06, "optim/total_tokens": 2000297132032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2422293424606323, "created_at": "2025-06-03T10:48:18.093382+00:00"} {"global_step": 238455, "acc_step": 0, "speed/wps": 5514.93439987185, "speed/FLOPS": 243731872481147.66, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047581300139427185, "optim/lr": 1.9367849015912154e-06, "optim/total_tokens": 2000305520640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2539863586425781, "created_at": "2025-06-03T10:48:21.071932+00:00"} {"global_step": 238456, "acc_step": 0, "speed/wps": 5531.386688498975, "speed/FLOPS": 244458979428019.53, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047119833528995514, "optim/lr": 1.9332376764966686e-06, "optim/total_tokens": 2000313909248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2578325271606445, "created_at": "2025-06-03T10:48:24.041213+00:00"} {"global_step": 238457, "acc_step": 0, "speed/wps": 5521.014253338498, "speed/FLOPS": 244000570884862.4, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0473189502954483, "optim/lr": 1.929690451402122e-06, "optim/total_tokens": 2000322297856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2537641525268555, "created_at": "2025-06-03T10:48:27.013214+00:00"} {"global_step": 238458, "acc_step": 0, "speed/wps": 5518.952061195054, "speed/FLOPS": 243909432547378.44, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0472550168633461, "optim/lr": 1.926143226307575e-06, "optim/total_tokens": 2000330686464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2411465644836426, "created_at": "2025-06-03T10:48:29.991116+00:00"} {"global_step": 238459, "acc_step": 0, "speed/wps": 5503.872721733884, "speed/FLOPS": 243243002926250.88, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.45 hours", "speed/est_time_elapsed_hrs": 197.12, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.45, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047517698258161545, "optim/lr": 1.9225960012132505e-06, "optim/total_tokens": 2000339075072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.259236216545105, "created_at": "2025-06-03T10:48:32.972278+00:00"} {"global_step": 238460, "acc_step": 0, "speed/wps": 5523.647079654869, "speed/FLOPS": 244116928332019.3, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04768289625644684, "optim/lr": 1.9190487761187037e-06, "optim/total_tokens": 2000347463680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2529957294464111, "created_at": "2025-06-03T10:48:35.943556+00:00"} {"global_step": 238461, "acc_step": 0, "speed/wps": 5524.322453557191, "speed/FLOPS": 244146776401624.9, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047260332852602005, "optim/lr": 1.915501551024157e-06, "optim/total_tokens": 2000355852288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2391475439071655, "created_at": "2025-06-03T10:48:38.915454+00:00"} {"global_step": 238462, "acc_step": 0, "speed/wps": 5535.217564997404, "speed/FLOPS": 244628284561046.66, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047750961035490036, "optim/lr": 1.91195432592961e-06, "optim/total_tokens": 2000364240896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2730673551559448, "created_at": "2025-06-03T10:48:41.882515+00:00"} {"global_step": 238463, "acc_step": 0, "speed/wps": 5523.157505745231, "speed/FLOPS": 244095291671079.72, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047990668565034866, "optim/lr": 1.9084071008352856e-06, "optim/total_tokens": 2000372629504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2584121227264404, "created_at": "2025-06-03T10:48:44.856721+00:00"} {"global_step": 238464, "acc_step": 0, "speed/wps": 5517.599116266423, "speed/FLOPS": 243849639306532.88, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048539821058511734, "optim/lr": 1.9048598757407388e-06, "optim/total_tokens": 2000381018112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2365778684616089, "created_at": "2025-06-03T10:48:47.831164+00:00"} {"global_step": 238465, "acc_step": 0, "speed/wps": 5526.892702654863, "speed/FLOPS": 244260368256014.53, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04717419669032097, "optim/lr": 1.901312650646192e-06, "optim/total_tokens": 2000389406720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2426633834838867, "created_at": "2025-06-03T10:48:50.800031+00:00"} {"global_step": 238466, "acc_step": 0, "speed/wps": 5522.077036689808, "speed/FLOPS": 244047540469171.97, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04901202768087387, "optim/lr": 1.8977654255516451e-06, "optim/total_tokens": 2000397795328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.255529761314392, "created_at": "2025-06-03T10:48:53.771419+00:00"} {"global_step": 238467, "acc_step": 0, "speed/wps": 5523.010414593427, "speed/FLOPS": 244088790995050.78, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0486440546810627, "optim/lr": 1.8942182004573205e-06, "optim/total_tokens": 2000406183936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2554361820220947, "created_at": "2025-06-03T10:48:56.747451+00:00"} {"global_step": 238468, "acc_step": 0, "speed/wps": 5524.129004319973, "speed/FLOPS": 244138226935502.84, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04906895384192467, "optim/lr": 1.8906709753627739e-06, "optim/total_tokens": 2000414572544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2476893663406372, "created_at": "2025-06-03T10:48:59.718034+00:00"} {"global_step": 238469, "acc_step": 0, "speed/wps": 5528.175121383954, "speed/FLOPS": 244317044599826.28, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048440348356962204, "optim/lr": 1.887123750268227e-06, "optim/total_tokens": 2000422961152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2293859720230103, "created_at": "2025-06-03T10:49:02.686315+00:00"} {"global_step": 238470, "acc_step": 0, "speed/wps": 5537.384731214854, "speed/FLOPS": 244724062215295.66, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 195.93, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04750334471464157, "optim/lr": 1.8835765251736802e-06, "optim/total_tokens": 2000431349760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2547587156295776, "created_at": "2025-06-03T10:49:05.652179+00:00"} {"global_step": 238471, "acc_step": 0, "speed/wps": 5523.611124601725, "speed/FLOPS": 244115339302705.0, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.44 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.44, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047693200409412384, "optim/lr": 1.8800293000793555e-06, "optim/total_tokens": 2000439738368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2555426359176636, "created_at": "2025-06-03T10:49:08.625197+00:00"} {"global_step": 238472, "acc_step": 0, "speed/wps": 5532.613844361569, "speed/FLOPS": 244513213435993.1, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04756636545062065, "optim/lr": 1.876482074984809e-06, "optim/total_tokens": 2000448126976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.262873649597168, "created_at": "2025-06-03T10:49:11.594789+00:00"} {"global_step": 238473, "acc_step": 0, "speed/wps": 5526.547503921084, "speed/FLOPS": 244245112238868.8, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04761110991239548, "optim/lr": 1.8729348498902621e-06, "optim/total_tokens": 2000456515584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2478188276290894, "created_at": "2025-06-03T10:49:14.563571+00:00"} {"global_step": 238474, "acc_step": 0, "speed/wps": 5531.5187313210845, "speed/FLOPS": 244464815044900.34, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04789593443274498, "optim/lr": 1.8693876247957153e-06, "optim/total_tokens": 2000464904192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2597756385803223, "created_at": "2025-06-03T10:49:17.529523+00:00"} {"global_step": 238475, "acc_step": 0, "speed/wps": 5519.235820210417, "speed/FLOPS": 243921973243447.16, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047160856425762177, "optim/lr": 1.8658403997013906e-06, "optim/total_tokens": 2000473292800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2520782947540283, "created_at": "2025-06-03T10:49:20.502196+00:00"} {"global_step": 238476, "acc_step": 0, "speed/wps": 5521.59199825326, "speed/FLOPS": 244026104252928.3, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04845830798149109, "optim/lr": 1.8622931746068438e-06, "optim/total_tokens": 2000481681408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2469022274017334, "created_at": "2025-06-03T10:49:23.474112+00:00"} {"global_step": 238477, "acc_step": 0, "speed/wps": 5532.239869478476, "speed/FLOPS": 244496685660337.34, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04785739630460739, "optim/lr": 1.8587459495122972e-06, "optim/total_tokens": 2000490070016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.256290078163147, "created_at": "2025-06-03T10:49:26.439963+00:00"} {"global_step": 238478, "acc_step": 0, "speed/wps": 5529.535320246405, "speed/FLOPS": 244377158427417.7, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05678718164563179, "optim/lr": 1.8551987244177504e-06, "optim/total_tokens": 2000498458624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.272377848625183, "created_at": "2025-06-03T10:49:29.408803+00:00"} {"global_step": 238479, "acc_step": 0, "speed/wps": 5517.228195757223, "speed/FLOPS": 243833246518569.5, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04848724603652954, "optim/lr": 1.8516514993234257e-06, "optim/total_tokens": 2000506847232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.257654070854187, "created_at": "2025-06-03T10:49:32.382876+00:00"} {"global_step": 238480, "acc_step": 0, "speed/wps": 5536.174149908243, "speed/FLOPS": 244670560717860.28, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049566011875867844, "optim/lr": 1.8481042742288789e-06, "optim/total_tokens": 2000515235840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2403979301452637, "created_at": "2025-06-03T10:49:35.351124+00:00"} {"global_step": 238481, "acc_step": 0, "speed/wps": 5526.937749233152, "speed/FLOPS": 244262359084205.66, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04921058192849159, "optim/lr": 1.8445570491343323e-06, "optim/total_tokens": 2000523624448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2408868074417114, "created_at": "2025-06-03T10:49:38.323154+00:00"} {"global_step": 238482, "acc_step": 0, "speed/wps": 5526.386588921477, "speed/FLOPS": 244238000619523.78, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04708477482199669, "optim/lr": 1.8410098240400076e-06, "optim/total_tokens": 2000532013056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2423440217971802, "created_at": "2025-06-03T10:49:41.292122+00:00"} {"global_step": 238483, "acc_step": 0, "speed/wps": 5506.644968654035, "speed/FLOPS": 243365522050475.53, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 197.03, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04749481379985809, "optim/lr": 1.8374625989454608e-06, "optim/total_tokens": 2000540401664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2456028461456299, "created_at": "2025-06-03T10:49:44.272620+00:00"} {"global_step": 238484, "acc_step": 0, "speed/wps": 5523.5228913259525, "speed/FLOPS": 244111439843534.7, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.43 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.43, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04708688706159592, "optim/lr": 1.833915373850914e-06, "optim/total_tokens": 2000548790272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2365151643753052, "created_at": "2025-06-03T10:49:47.247426+00:00"} {"global_step": 238485, "acc_step": 0, "speed/wps": 5513.189413471725, "speed/FLOPS": 243654753013912.22, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.7, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04842903092503548, "optim/lr": 1.8303681487563673e-06, "optim/total_tokens": 2000557178880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2597092390060425, "created_at": "2025-06-03T10:49:50.228376+00:00"} {"global_step": 238486, "acc_step": 0, "speed/wps": 5525.067206347066, "speed/FLOPS": 244179690662947.03, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047079332172870636, "optim/lr": 1.8268209236620427e-06, "optim/total_tokens": 2000565567488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.250244379043579, "created_at": "2025-06-03T10:49:53.203669+00:00"} {"global_step": 238487, "acc_step": 0, "speed/wps": 5522.582802563165, "speed/FLOPS": 244069892732029.97, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04795756936073303, "optim/lr": 1.8232736985674958e-06, "optim/total_tokens": 2000573956096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2415027618408203, "created_at": "2025-06-03T10:49:56.177855+00:00"} {"global_step": 238488, "acc_step": 0, "speed/wps": 5526.870471565908, "speed/FLOPS": 244259385755671.75, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04792345315217972, "optim/lr": 1.819726473472949e-06, "optim/total_tokens": 2000582344704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2536276578903198, "created_at": "2025-06-03T10:49:59.147211+00:00"} {"global_step": 238489, "acc_step": 0, "speed/wps": 5524.198400085874, "speed/FLOPS": 244141293873155.94, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04905030503869057, "optim/lr": 1.8161792483784024e-06, "optim/total_tokens": 2000590733312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2744337320327759, "created_at": "2025-06-03T10:50:02.117045+00:00"} {"global_step": 238490, "acc_step": 0, "speed/wps": 5528.549560247973, "speed/FLOPS": 244333592881064.06, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047348134219646454, "optim/lr": 1.8126320232840775e-06, "optim/total_tokens": 2000599121920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.250591516494751, "created_at": "2025-06-03T10:50:05.085107+00:00"} {"global_step": 238491, "acc_step": 0, "speed/wps": 5522.688987125106, "speed/FLOPS": 244074585546165.88, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047155894339084625, "optim/lr": 1.809084798189531e-06, "optim/total_tokens": 2000607510528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2563923597335815, "created_at": "2025-06-03T10:50:08.055910+00:00"} {"global_step": 238492, "acc_step": 0, "speed/wps": 5512.721289225342, "speed/FLOPS": 243634064318299.2, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04696264490485191, "optim/lr": 1.805537573094984e-06, "optim/total_tokens": 2000615899136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2503825426101685, "created_at": "2025-06-03T10:50:11.035328+00:00"} {"global_step": 238493, "acc_step": 0, "speed/wps": 5518.592990294058, "speed/FLOPS": 243893563451445.88, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047236520797014236, "optim/lr": 1.8019903480004373e-06, "optim/total_tokens": 2000624287744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.248480200767517, "created_at": "2025-06-03T10:50:14.008988+00:00"} {"global_step": 238494, "acc_step": 0, "speed/wps": 5532.469903280571, "speed/FLOPS": 244506851976970.22, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0473899208009243, "optim/lr": 1.7984431229061126e-06, "optim/total_tokens": 2000632676352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2256733179092407, "created_at": "2025-06-03T10:50:16.974603+00:00"} {"global_step": 238495, "acc_step": 0, "speed/wps": 5519.489378015352, "speed/FLOPS": 243933179200598.78, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.42 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.42, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047304417937994, "optim/lr": 1.794895897811566e-06, "optim/total_tokens": 2000641064960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2610530853271484, "created_at": "2025-06-03T10:50:19.950968+00:00"} {"global_step": 238496, "acc_step": 0, "speed/wps": 5532.360187132607, "speed/FLOPS": 244502003084808.38, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.41 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.41, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04859769716858864, "optim/lr": 1.7913486727170192e-06, "optim/total_tokens": 2000649453568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.257464051246643, "created_at": "2025-06-03T10:50:22.917016+00:00"} {"global_step": 238497, "acc_step": 0, "speed/wps": 5532.610434899138, "speed/FLOPS": 244513062755204.88, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.41 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.41, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0653916597366333, "optim/lr": 1.7878014476224724e-06, "optim/total_tokens": 2000657842176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.253113031387329, "created_at": "2025-06-03T10:50:25.883309+00:00"} {"global_step": 238498, "acc_step": 0, "speed/wps": 5533.609803016878, "speed/FLOPS": 244557229710779.22, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.41 hours", "speed/est_time_elapsed_hrs": 196.01, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.41, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047054827213287354, "optim/lr": 1.7842542225281477e-06, "optim/total_tokens": 2000666230784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.2565425634384155, "created_at": "2025-06-03T10:50:28.851109+00:00"} {"global_step": 238499, "acc_step": 0, "speed/wps": 5532.113061190793, "speed/FLOPS": 244491081383085.4, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.41 hours", "speed/est_time_elapsed_hrs": 196.15, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.41, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04777801036834717, "optim/lr": 1.780706997433601e-06, "optim/total_tokens": 2000674619392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2579388618469238, "created_at": "2025-06-03T10:50:31.822700+00:00"} {"global_step": 238500, "acc_step": 0, "speed/wps": 5510.5947142386785, "speed/FLOPS": 243540080588686.16, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.41 hours", "speed/est_time_elapsed_hrs": 196.9, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.41, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04752769693732262, "optim/lr": 1.7771597723390542e-06, "optim/total_tokens": 2000683008000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2532089948654175, "created_at": "2025-06-03T10:50:34.800238+00:00"} {"global_step": 238501, "acc_step": 0, "speed/wps": 246.44605529772582, "speed/FLOPS": 10891654218897.498, "speed/curr_iter_time": 2.8791, "speed/data_load_time": 0.0019, "speed/curr_step_time": 2.8791, "speed/est_time_elapsed": "7.95 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 190.74, "speed/est_time_elapsed_days": 7.95, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04678856581449509, "optim/lr": 1.7736125472445074e-06, "optim/total_tokens": 2000691396608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2555091381072998, "created_at": "2025-06-03T10:51:41.289219+00:00"} {"global_step": 238502, "acc_step": 0, "speed/wps": 5626.892777100815, "speed/FLOPS": 248679859699744.56, "speed/curr_iter_time": 2.9104, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9104, "speed/est_time_elapsed": "8.03 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 192.82, "speed/est_time_elapsed_days": 8.03, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0472506619989872, "optim/lr": 1.7700653221501827e-06, "optim/total_tokens": 2000699785216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2503938674926758, "created_at": "2025-06-03T10:51:44.210060+00:00"} {"global_step": 238503, "acc_step": 0, "speed/wps": 5599.343861112759, "speed/FLOPS": 247462338621207.25, "speed/curr_iter_time": 2.9249, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9249, "speed/est_time_elapsed": "8.07 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 193.78, "speed/est_time_elapsed_days": 8.07, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.046949245035648346, "optim/lr": 1.7665180970556361e-06, "optim/total_tokens": 2000708173824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2501306533813477, "created_at": "2025-06-03T10:51:47.143776+00:00"} {"global_step": 238504, "acc_step": 0, "speed/wps": 5569.565721751981, "speed/FLOPS": 246146297279795.16, "speed/curr_iter_time": 2.9391, "speed/data_load_time": 0.0008, "speed/curr_step_time": 2.9391, "speed/est_time_elapsed": "8.11 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 194.72, "speed/est_time_elapsed_days": 8.11, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049844857305288315, "optim/lr": 1.7629708719610893e-06, "optim/total_tokens": 2000716562432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2522600889205933, "created_at": "2025-06-03T10:51:50.094072+00:00"} {"global_step": 238505, "acc_step": 0, "speed/wps": 5582.843929468427, "speed/FLOPS": 246733126096833.84, "speed/curr_iter_time": 2.9336, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9336, "speed/est_time_elapsed": "8.1 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 194.36, "speed/est_time_elapsed_days": 8.1, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049208272248506546, "optim/lr": 1.7594236468665425e-06, "optim/total_tokens": 2000724951040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2495193481445312, "created_at": "2025-06-03T10:51:53.038006+00:00"} {"global_step": 238506, "acc_step": 0, "speed/wps": 5565.465271657825, "speed/FLOPS": 245965078373639.62, "speed/curr_iter_time": 2.9428, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9428, "speed/est_time_elapsed": "8.12 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 194.97, "speed/est_time_elapsed_days": 8.12, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04753937944769859, "optim/lr": 1.7558764217722178e-06, "optim/total_tokens": 2000733339648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2576032876968384, "created_at": "2025-06-03T10:51:55.991008+00:00"} {"global_step": 238507, "acc_step": 0, "speed/wps": 5555.1268826663845, "speed/FLOPS": 245508174496889.84, "speed/curr_iter_time": 2.9469, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9469, "speed/est_time_elapsed": "8.13 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.24, "speed/est_time_elapsed_days": 8.13, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048835575580596924, "optim/lr": 1.752329196677671e-06, "optim/total_tokens": 2000741728256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2598785161972046, "created_at": "2025-06-03T10:51:58.944811+00:00"} {"global_step": 238508, "acc_step": 0, "speed/wps": 5555.464699669674, "speed/FLOPS": 245523104279331.06, "speed/curr_iter_time": 2.9481, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9481, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.32, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05910966917872429, "optim/lr": 1.7487819715831244e-06, "optim/total_tokens": 2000750116864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.245522379875183, "created_at": "2025-06-03T10:52:01.901205+00:00"} {"global_step": 238509, "acc_step": 0, "speed/wps": 5546.50985390088, "speed/FLOPS": 245127345931406.1, "speed/curr_iter_time": 2.9529, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9529, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.64, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048516593873500824, "optim/lr": 1.7452347464887997e-06, "optim/total_tokens": 2000758505472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2309458255767822, "created_at": "2025-06-03T10:52:04.859435+00:00"} {"global_step": 238510, "acc_step": 0, "speed/wps": 5541.924884468374, "speed/FLOPS": 244924713750490.28, "speed/curr_iter_time": 2.9553, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9553, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.8, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04755097255110741, "optim/lr": 1.741687521394253e-06, "optim/total_tokens": 2000766894080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2483243942260742, "created_at": "2025-06-03T10:52:07.824726+00:00"} {"global_step": 238511, "acc_step": 0, "speed/wps": 5523.2758055484, "speed/FLOPS": 244100519916866.5, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04746881127357483, "optim/lr": 1.738140296299706e-06, "optim/total_tokens": 2000775282688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2408188581466675, "created_at": "2025-06-03T10:52:10.796098+00:00"} {"global_step": 238512, "acc_step": 0, "speed/wps": 5529.76809538295, "speed/FLOPS": 244387445897001.84, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.0470740832388401, "optim/lr": 1.7345930712051595e-06, "optim/total_tokens": 2000783671296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2560888528823853, "created_at": "2025-06-03T10:52:13.769886+00:00"} {"global_step": 238513, "acc_step": 0, "speed/wps": 5525.729507163502, "speed/FLOPS": 244208960969070.62, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048246439546346664, "optim/lr": 1.7310458461108348e-06, "optim/total_tokens": 2000792059904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2554042339324951, "created_at": "2025-06-03T10:52:16.743951+00:00"} {"global_step": 238514, "acc_step": 0, "speed/wps": 5541.574188142936, "speed/FLOPS": 244909214767932.44, "speed/curr_iter_time": 2.9543, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9543, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.73, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.050296127796173096, "optim/lr": 1.727498621016288e-06, "optim/total_tokens": 2000800448512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.236449122428894, "created_at": "2025-06-03T10:52:19.705215+00:00"} {"global_step": 238515, "acc_step": 0, "speed/wps": 5551.810369083761, "speed/FLOPS": 245361601571993.25, "speed/curr_iter_time": 2.9501, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9501, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.46, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04957708716392517, "optim/lr": 1.7239513959217412e-06, "optim/total_tokens": 2000808837120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2510366439819336, "created_at": "2025-06-03T10:52:22.660877+00:00"} {"global_step": 238516, "acc_step": 0, "speed/wps": 5554.789560577235, "speed/FLOPS": 245493266587120.38, "speed/curr_iter_time": 2.9485, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9485, "speed/est_time_elapsed": "8.14 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.35, "speed/est_time_elapsed_days": 8.14, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04830305278301239, "optim/lr": 1.7204041708271945e-06, "optim/total_tokens": 2000817225728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.239790678024292, "created_at": "2025-06-03T10:52:25.615044+00:00"} {"global_step": 238517, "acc_step": 0, "speed/wps": 5540.78971341599, "speed/FLOPS": 244874545000307.1, "speed/curr_iter_time": 2.9545, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9545, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04805070534348488, "optim/lr": 1.7168569457328699e-06, "optim/total_tokens": 2000825614336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2402729988098145, "created_at": "2025-06-03T10:52:28.579724+00:00"} {"global_step": 238518, "acc_step": 0, "speed/wps": 5531.675074207707, "speed/FLOPS": 244471724600253.62, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 196.17, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04834460839629173, "optim/lr": 1.713309720638323e-06, "optim/total_tokens": 2000834002944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2497352361679077, "created_at": "2025-06-03T10:52:31.546069+00:00"} {"global_step": 238519, "acc_step": 0, "speed/wps": 5530.216511911354, "speed/FLOPS": 244407263612353.44, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047425370663404465, "optim/lr": 1.7097624955437762e-06, "optim/total_tokens": 2000842391552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2518188953399658, "created_at": "2025-06-03T10:52:34.516396+00:00"} {"global_step": 238520, "acc_step": 0, "speed/wps": 5526.457305298103, "speed/FLOPS": 244241125921411.47, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.4 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.4, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04680312052369118, "optim/lr": 1.7062152704492296e-06, "optim/total_tokens": 2000850780160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2330480813980103, "created_at": "2025-06-03T10:52:37.490678+00:00"} {"global_step": 238521, "acc_step": 0, "speed/wps": 5530.355097949544, "speed/FLOPS": 244413388405893.78, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04760691896080971, "optim/lr": 1.7026680453549047e-06, "optim/total_tokens": 2000859168768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2604032754898071, "created_at": "2025-06-03T10:52:40.461737+00:00"} {"global_step": 238522, "acc_step": 0, "speed/wps": 5544.841267689841, "speed/FLOPS": 245053602961476.56, "speed/curr_iter_time": 2.9538, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9538, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 195.71, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04791298508644104, "optim/lr": 1.6991208202603581e-06, "optim/total_tokens": 2000867557376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2412816286087036, "created_at": "2025-06-03T10:52:43.426200+00:00"} {"global_step": 238523, "acc_step": 0, "speed/wps": 5543.813604282757, "speed/FLOPS": 245008185498941.66, "speed/curr_iter_time": 2.9544, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9544, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 195.75, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04785192012786865, "optim/lr": 1.6955735951658113e-06, "optim/total_tokens": 2000875945984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2313605546951294, "created_at": "2025-06-03T10:52:46.389625+00:00"} {"global_step": 238524, "acc_step": 0, "speed/wps": 5541.148702468658, "speed/FLOPS": 244890410478962.44, "speed/curr_iter_time": 2.9545, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9545, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 195.76, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04788465425372124, "optim/lr": 1.6920263700712645e-06, "optim/total_tokens": 2000884334592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.266958475112915, "created_at": "2025-06-03T10:52:49.351634+00:00"} {"global_step": 238525, "acc_step": 0, "speed/wps": 5537.515237764872, "speed/FLOPS": 244729829936813.38, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04766954109072685, "optim/lr": 1.6884791449769398e-06, "optim/total_tokens": 2000892723200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2467716932296753, "created_at": "2025-06-03T10:52:52.315039+00:00"} {"global_step": 238526, "acc_step": 0, "speed/wps": 5535.674365513698, "speed/FLOPS": 244648472805749.84, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 196.04, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04754215106368065, "optim/lr": 1.6849319198823932e-06, "optim/total_tokens": 2000901111808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 420, "loss/out": 1.2562414407730103, "created_at": "2025-06-03T10:52:55.279342+00:00"} {"global_step": 238527, "acc_step": 0, "speed/wps": 5539.3282663492055, "speed/FLOPS": 244809956520319.4, "speed/curr_iter_time": 2.9568, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9568, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 195.91, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04714832082390785, "optim/lr": 1.6813846947878464e-06, "optim/total_tokens": 2000909500416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2540299892425537, "created_at": "2025-06-03T10:52:58.246524+00:00"} {"global_step": 238528, "acc_step": 0, "speed/wps": 5526.750452038764, "speed/FLOPS": 244254081506887.62, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04700550064444542, "optim/lr": 1.6778374696932996e-06, "optim/total_tokens": 2000917889024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.245963454246521, "created_at": "2025-06-03T10:53:01.216633+00:00"} {"global_step": 238529, "acc_step": 0, "speed/wps": 5527.0789280936015, "speed/FLOPS": 244268598467218.6, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 196.34, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04714803770184517, "optim/lr": 1.6742902445989749e-06, "optim/total_tokens": 2000926277632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.2474066019058228, "created_at": "2025-06-03T10:53:04.188530+00:00"} {"global_step": 238530, "acc_step": 0, "speed/wps": 5527.680540433927, "speed/FLOPS": 244295186653329.84, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04782178997993469, "optim/lr": 1.6707430195044283e-06, "optim/total_tokens": 2000934666240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2791508436203003, "created_at": "2025-06-03T10:53:07.159985+00:00"} {"global_step": 238531, "acc_step": 0, "speed/wps": 5535.195266451754, "speed/FLOPS": 244627299079463.22, "speed/curr_iter_time": 2.9577, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9577, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.39 hours", "speed/est_time_elapsed_hrs": 195.97, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.39, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05226357653737068, "optim/lr": 1.6671957944098815e-06, "optim/total_tokens": 2000943054848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.252483606338501, "created_at": "2025-06-03T10:53:10.129637+00:00"} {"global_step": 238532, "acc_step": 0, "speed/wps": 5545.3622425527, "speed/FLOPS": 245076627383823.88, "speed/curr_iter_time": 2.9535, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9535, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 195.7, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047961585223674774, "optim/lr": 1.6636485693153346e-06, "optim/total_tokens": 2000951443456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2384235858917236, "created_at": "2025-06-03T10:53:13.092734+00:00"} {"global_step": 238533, "acc_step": 0, "speed/wps": 5532.93149784931, "speed/FLOPS": 244527252094253.3, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.08873944729566574, "optim/lr": 1.66010134422101e-06, "optim/total_tokens": 2000959832064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2553492784500122, "created_at": "2025-06-03T10:53:16.063797+00:00"} {"global_step": 238534, "acc_step": 0, "speed/wps": 5524.361601624537, "speed/FLOPS": 244148506545823.62, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047958455979824066, "optim/lr": 1.6565541191264633e-06, "optim/total_tokens": 2000968220672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2704989910125732, "created_at": "2025-06-03T10:53:19.034064+00:00"} {"global_step": 238535, "acc_step": 0, "speed/wps": 5533.572358761423, "speed/FLOPS": 244555574866345.2, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04813002049922943, "optim/lr": 1.6530068940319165e-06, "optim/total_tokens": 2000976609280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2602545022964478, "created_at": "2025-06-03T10:53:22.003830+00:00"} {"global_step": 238536, "acc_step": 0, "speed/wps": 5526.35766254143, "speed/FLOPS": 244236722221584.34, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.37, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049379609525203705, "optim/lr": 1.6494596689375918e-06, "optim/total_tokens": 2000984997888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.2579411268234253, "created_at": "2025-06-03T10:53:24.973041+00:00"} {"global_step": 238537, "acc_step": 0, "speed/wps": 5523.557391474124, "speed/FLOPS": 244112964573496.1, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048103805631399155, "optim/lr": 1.645912443843045e-06, "optim/total_tokens": 2000993386496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2508937120437622, "created_at": "2025-06-03T10:53:27.945301+00:00"} {"global_step": 238538, "acc_step": 0, "speed/wps": 5531.136906184924, "speed/FLOPS": 244447940328240.25, "speed/curr_iter_time": 2.9598, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9598, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.048245225101709366, "optim/lr": 1.6423652187484982e-06, "optim/total_tokens": 2001001775104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2589219808578491, "created_at": "2025-06-03T10:53:30.912462+00:00"} {"global_step": 238539, "acc_step": 0, "speed/wps": 5535.746405013672, "speed/FLOPS": 244651656582917.12, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.05, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.046973809599876404, "optim/lr": 1.6388179936539516e-06, "optim/total_tokens": 2001010163712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2625614404678345, "created_at": "2025-06-03T10:53:33.880502+00:00"} {"global_step": 238540, "acc_step": 0, "speed/wps": 5522.090658651592, "speed/FLOPS": 244048142490159.3, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04800224304199219, "optim/lr": 1.635270768559627e-06, "optim/total_tokens": 2001018552320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2605881690979004, "created_at": "2025-06-03T10:53:36.855296+00:00"} {"global_step": 238541, "acc_step": 0, "speed/wps": 5530.286919529178, "speed/FLOPS": 244410375268682.38, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04782719910144806, "optim/lr": 1.6317235434650801e-06, "optim/total_tokens": 2001026940928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2634222507476807, "created_at": "2025-06-03T10:53:39.822138+00:00"} {"global_step": 238542, "acc_step": 0, "speed/wps": 5527.9176170417395, "speed/FLOPS": 244305664225927.1, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047875840216875076, "optim/lr": 1.6281763183705333e-06, "optim/total_tokens": 2001035329536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2527873516082764, "created_at": "2025-06-03T10:53:42.794210+00:00"} {"global_step": 238543, "acc_step": 0, "speed/wps": 5518.017696166024, "speed/FLOPS": 243868138395609.06, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.68, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04783037304878235, "optim/lr": 1.6246290932759867e-06, "optim/total_tokens": 2001043718144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2419390678405762, "created_at": "2025-06-03T10:53:45.767856+00:00"} {"global_step": 238544, "acc_step": 0, "speed/wps": 5525.3820852949775, "speed/FLOPS": 244193606700748.2, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04757297784090042, "optim/lr": 1.621081868181662e-06, "optim/total_tokens": 2001052106752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2605031728744507, "created_at": "2025-06-03T10:53:48.737600+00:00"} {"global_step": 238545, "acc_step": 0, "speed/wps": 5518.123668035571, "speed/FLOPS": 243872821809829.88, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.38 hours", "speed/est_time_elapsed_hrs": 196.68, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.38, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.049339406192302704, "optim/lr": 1.6175346430871152e-06, "optim/total_tokens": 2001060495360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2591657638549805, "created_at": "2025-06-03T10:53:51.711150+00:00"} {"global_step": 238546, "acc_step": 0, "speed/wps": 5530.28167794671, "speed/FLOPS": 244410143617566.16, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047526970505714417, "optim/lr": 1.6139874179925684e-06, "optim/total_tokens": 2001068883968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2404061555862427, "created_at": "2025-06-03T10:53:54.682509+00:00"} {"global_step": 238547, "acc_step": 0, "speed/wps": 5527.575163803939, "speed/FLOPS": 244290529545650.88, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.34, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04678132012486458, "optim/lr": 1.6104401928980218e-06, "optim/total_tokens": 2001077272576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2561489343643188, "created_at": "2025-06-03T10:53:57.654855+00:00"} {"global_step": 238548, "acc_step": 0, "speed/wps": 5539.487313793862, "speed/FLOPS": 244816985603294.6, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 195.82, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04707185924053192, "optim/lr": 1.606892967803697e-06, "optim/total_tokens": 2001085661184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2475948333740234, "created_at": "2025-06-03T10:54:00.623523+00:00"} {"global_step": 238549, "acc_step": 0, "speed/wps": 5540.941234368535, "speed/FLOPS": 244881241450855.03, "speed/curr_iter_time": 2.9559, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9559, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 195.87, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04805188626050949, "optim/lr": 1.6033457427091503e-06, "optim/total_tokens": 2001094049792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.263966679573059, "created_at": "2025-06-03T10:54:03.588627+00:00"} {"global_step": 238550, "acc_step": 0, "speed/wps": 5532.111167145742, "speed/FLOPS": 244490997675988.75, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047164496034383774, "optim/lr": 1.5997985176146034e-06, "optim/total_tokens": 2001102438400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2418506145477295, "created_at": "2025-06-03T10:54:06.554989+00:00"} {"global_step": 238551, "acc_step": 0, "speed/wps": 5529.831279712126, "speed/FLOPS": 244390238320944.7, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04768892377614975, "optim/lr": 1.5962512925200568e-06, "optim/total_tokens": 2001110827008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2381600141525269, "created_at": "2025-06-03T10:54:09.522198+00:00"} {"global_step": 238552, "acc_step": 0, "speed/wps": 5538.25589376202, "speed/FLOPS": 244762563140866.25, "speed/curr_iter_time": 2.9573, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9573, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 195.96, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04798901453614235, "optim/lr": 1.592704067425732e-06, "optim/total_tokens": 2001119215616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2329257726669312, "created_at": "2025-06-03T10:54:12.485346+00:00"} {"global_step": 238553, "acc_step": 0, "speed/wps": 5529.80897456909, "speed/FLOPS": 244389252547790.6, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.05055968090891838, "optim/lr": 1.5891568423311853e-06, "optim/total_tokens": 2001127604224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.243405818939209, "created_at": "2025-06-03T10:54:15.456841+00:00"} {"global_step": 238554, "acc_step": 0, "speed/wps": 5530.109035943723, "speed/FLOPS": 244402513724696.0, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047392576932907104, "optim/lr": 1.5856096172366385e-06, "optim/total_tokens": 2001135992832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2631474733352661, "created_at": "2025-06-03T10:54:18.423595+00:00"} {"global_step": 238555, "acc_step": 0, "speed/wps": 5526.033628704921, "speed/FLOPS": 244222401584566.22, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.046991921961307526, "optim/lr": 1.5820623921420917e-06, "optim/total_tokens": 2001144381440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.244995355606079, "created_at": "2025-06-03T10:54:21.392609+00:00"} {"global_step": 238556, "acc_step": 0, "speed/wps": 5512.399403918865, "speed/FLOPS": 243619838635311.25, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.37 hours", "speed/est_time_elapsed_hrs": 196.89, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.37, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04895170032978058, "optim/lr": 1.578515167047767e-06, "optim/total_tokens": 2001152770048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.229259967803955, "created_at": "2025-06-03T10:54:24.371295+00:00"} {"global_step": 238557, "acc_step": 0, "speed/wps": 5537.302974553357, "speed/FLOPS": 244720448989326.03, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.0, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.046941448003053665, "optim/lr": 1.5749679419532204e-06, "optim/total_tokens": 2001161158656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2653740644454956, "created_at": "2025-06-03T10:54:27.337311+00:00"} {"global_step": 238558, "acc_step": 0, "speed/wps": 5527.119001293474, "speed/FLOPS": 244270369497539.72, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047085076570510864, "optim/lr": 1.5714207168586736e-06, "optim/total_tokens": 2001169547264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2550982236862183, "created_at": "2025-06-03T10:54:30.307945+00:00"} {"global_step": 238559, "acc_step": 0, "speed/wps": 5531.239357839199, "speed/FLOPS": 244452468166964.12, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04728437215089798, "optim/lr": 1.5678734917641268e-06, "optim/total_tokens": 2001177935872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2742904424667358, "created_at": "2025-06-03T10:54:33.277844+00:00"} {"global_step": 238560, "acc_step": 0, "speed/wps": 5529.605307286707, "speed/FLOPS": 244380251496372.9, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047703176736831665, "optim/lr": 1.564326266669802e-06, "optim/total_tokens": 2001186324480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.240127444267273, "created_at": "2025-06-03T10:54:36.246688+00:00"} {"global_step": 238561, "acc_step": 0, "speed/wps": 5535.778355379887, "speed/FLOPS": 244653068625567.03, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.047733090817928314, "optim/lr": 1.5607790415752555e-06, "optim/total_tokens": 2001194713088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2560858726501465, "created_at": "2025-06-03T10:54:39.210535+00:00"} {"global_step": 238562, "acc_step": 0, "speed/wps": 5526.481440181227, "speed/FLOPS": 244242192559712.0, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04885075241327286, "optim/lr": 1.5572318164807087e-06, "optim/total_tokens": 2001203101696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2508527040481567, "created_at": "2025-06-03T10:54:42.184962+00:00"} {"global_step": 238563, "acc_step": 0, "speed/wps": 5515.684734371534, "speed/FLOPS": 243765033425473.6, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.77, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.02, "optim/grad_norm": 0.04757186397910118, "optim/lr": 1.553684591386384e-06, "optim/total_tokens": 2001211490304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.2460556030273438, "created_at": "2025-06-03T10:54:45.165071+00:00"} {"global_step": 238564, "acc_step": 0, "speed/wps": 5525.189633387688, "speed/FLOPS": 244185101311504.16, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04682476073503494, "optim/lr": 1.5501373662918372e-06, "optim/total_tokens": 2001219878912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2512205839157104, "created_at": "2025-06-03T10:54:48.135155+00:00"} {"global_step": 238565, "acc_step": 0, "speed/wps": 5516.651246432507, "speed/FLOPS": 243807748311511.38, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04865206032991409, "optim/lr": 1.5465901411972906e-06, "optim/total_tokens": 2001228267520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2589588165283203, "created_at": "2025-06-03T10:54:51.109531+00:00"} {"global_step": 238566, "acc_step": 0, "speed/wps": 5532.246821888712, "speed/FLOPS": 244496992921284.1, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047254398465156555, "optim/lr": 1.5430429161027437e-06, "optim/total_tokens": 2001236656128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2381192445755005, "created_at": "2025-06-03T10:54:54.074815+00:00"} {"global_step": 238567, "acc_step": 0, "speed/wps": 5525.034632497239, "speed/FLOPS": 244178251065512.75, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0470028854906559, "optim/lr": 1.539495691008419e-06, "optim/total_tokens": 2001245044736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2481868267059326, "created_at": "2025-06-03T10:54:57.047030+00:00"} {"global_step": 238568, "acc_step": 0, "speed/wps": 5530.016719771835, "speed/FLOPS": 244398433822415.53, "speed/curr_iter_time": 2.9604, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9604, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047316860407590866, "optim/lr": 1.5359484659138722e-06, "optim/total_tokens": 2001253433344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2472749948501587, "created_at": "2025-06-03T10:55:00.017464+00:00"} {"global_step": 238569, "acc_step": 0, "speed/wps": 5519.601834390306, "speed/FLOPS": 243938149196767.88, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.36 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.36, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04908657446503639, "optim/lr": 1.5324012408193254e-06, "optim/total_tokens": 2001261821952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2543283700942993, "created_at": "2025-06-03T10:55:02.993062+00:00"} {"global_step": 238570, "acc_step": 0, "speed/wps": 5515.8133488581225, "speed/FLOPS": 243770717527472.16, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04849366471171379, "optim/lr": 1.5288540157247788e-06, "optim/total_tokens": 2001270210560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2502789497375488, "created_at": "2025-06-03T10:55:05.972647+00:00"} {"global_step": 238571, "acc_step": 0, "speed/wps": 5509.396735319492, "speed/FLOPS": 243487136052270.1, "speed/curr_iter_time": 2.9717, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9717, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.93, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047751542180776596, "optim/lr": 1.5253067906304541e-06, "optim/total_tokens": 2001278599168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.233422875404358, "created_at": "2025-06-03T10:55:08.952377+00:00"} {"global_step": 238572, "acc_step": 0, "speed/wps": 5520.67543980088, "speed/FLOPS": 243985597060704.6, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047005411237478256, "optim/lr": 1.5217595655359073e-06, "optim/total_tokens": 2001286987776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.255170464515686, "created_at": "2025-06-03T10:55:11.928221+00:00"} {"global_step": 238573, "acc_step": 0, "speed/wps": 5520.674193292156, "speed/FLOPS": 243985541971399.2, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.61, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04754190146923065, "optim/lr": 1.5182123404413605e-06, "optim/total_tokens": 2001295376384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2533648014068604, "created_at": "2025-06-03T10:55:14.903675+00:00"} {"global_step": 238574, "acc_step": 0, "speed/wps": 5531.33950367664, "speed/FLOPS": 244456894100386.12, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04930220916867256, "optim/lr": 1.5146651153468139e-06, "optim/total_tokens": 2001303764992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2489193677902222, "created_at": "2025-06-03T10:55:17.870094+00:00"} {"global_step": 238575, "acc_step": 0, "speed/wps": 5514.881321657101, "speed/FLOPS": 243729526695734.7, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048743344843387604, "optim/lr": 1.5111178902524892e-06, "optim/total_tokens": 2001312153600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2603986263275146, "created_at": "2025-06-03T10:55:20.845069+00:00"} {"global_step": 238576, "acc_step": 0, "speed/wps": 5531.519268757991, "speed/FLOPS": 244464838796860.75, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04738606885075569, "optim/lr": 1.5075706651579424e-06, "optim/total_tokens": 2001320542208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.257215976715088, "created_at": "2025-06-03T10:55:23.811860+00:00"} {"global_step": 238577, "acc_step": 0, "speed/wps": 5531.543250029579, "speed/FLOPS": 244465898646317.7, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04682566225528717, "optim/lr": 1.5040234400633956e-06, "optim/total_tokens": 2001328930816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2614086866378784, "created_at": "2025-06-03T10:55:26.778077+00:00"} {"global_step": 238578, "acc_step": 0, "speed/wps": 5523.4503484668985, "speed/FLOPS": 244108233820472.5, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04688854143023491, "optim/lr": 1.500476214968849e-06, "optim/total_tokens": 2001337319424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2533233165740967, "created_at": "2025-06-03T10:55:29.748534+00:00"} {"global_step": 238579, "acc_step": 0, "speed/wps": 5517.046202034409, "speed/FLOPS": 243825203327549.44, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.75, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04677189141511917, "optim/lr": 1.4969289898745243e-06, "optim/total_tokens": 2001345708032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2583506107330322, "created_at": "2025-06-03T10:55:32.722761+00:00"} {"global_step": 238580, "acc_step": 0, "speed/wps": 5527.579906571266, "speed/FLOPS": 244290739151691.06, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.35 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.35, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047977201640605927, "optim/lr": 1.4933817647799775e-06, "optim/total_tokens": 2001354096640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.261189341545105, "created_at": "2025-06-03T10:55:35.693012+00:00"} {"global_step": 238581, "acc_step": 0, "speed/wps": 5526.912830728458, "speed/FLOPS": 244261257813842.62, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046830564737319946, "optim/lr": 1.4898345396854306e-06, "optim/total_tokens": 2001362485248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2663228511810303, "created_at": "2025-06-03T10:55:38.665824+00:00"} {"global_step": 238582, "acc_step": 0, "speed/wps": 5526.222694854463, "speed/FLOPS": 244230757340647.66, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.34, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0474277101457119, "optim/lr": 1.486287314590884e-06, "optim/total_tokens": 2001370873856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2591546773910522, "created_at": "2025-06-03T10:55:41.639257+00:00"} {"global_step": 238583, "acc_step": 0, "speed/wps": 5528.302308163199, "speed/FLOPS": 244322665604467.94, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.35, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04739336296916008, "optim/lr": 1.4827400894965591e-06, "optim/total_tokens": 2001379262464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2560458183288574, "created_at": "2025-06-03T10:55:44.611636+00:00"} {"global_step": 238584, "acc_step": 0, "speed/wps": 5525.2526589012205, "speed/FLOPS": 244187886716608.47, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04777663201093674, "optim/lr": 1.4791928644020125e-06, "optim/total_tokens": 2001387651072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2532414197921753, "created_at": "2025-06-03T10:55:47.586587+00:00"} {"global_step": 238585, "acc_step": 0, "speed/wps": 5525.666479882824, "speed/FLOPS": 244206175485867.53, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04704270884394646, "optim/lr": 1.4756456393074657e-06, "optim/total_tokens": 2001396039680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2697831392288208, "created_at": "2025-06-03T10:55:50.561959+00:00"} {"global_step": 238586, "acc_step": 0, "speed/wps": 5511.42670551958, "speed/FLOPS": 243576850344784.6, "speed/curr_iter_time": 2.9718, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9718, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.95, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0473766103386879, "optim/lr": 1.472098414212919e-06, "optim/total_tokens": 2001404428288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2694692611694336, "created_at": "2025-06-03T10:55:53.540344+00:00"} {"global_step": 238587, "acc_step": 0, "speed/wps": 5525.785121940256, "speed/FLOPS": 244211418857540.94, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04750186204910278, "optim/lr": 1.4685511891185942e-06, "optim/total_tokens": 2001412816896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 424, "loss/out": 1.250872015953064, "created_at": "2025-06-03T10:55:56.513514+00:00"} {"global_step": 238588, "acc_step": 0, "speed/wps": 5522.023340771395, "speed/FLOPS": 244045167384418.75, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04798848181962967, "optim/lr": 1.4650039640240476e-06, "optim/total_tokens": 2001421205504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.240410327911377, "created_at": "2025-06-03T10:55:59.488327+00:00"} {"global_step": 238589, "acc_step": 0, "speed/wps": 5530.375479435937, "speed/FLOPS": 244414289163270.47, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04718293994665146, "optim/lr": 1.4614567389295008e-06, "optim/total_tokens": 2001429594112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2368203401565552, "created_at": "2025-06-03T10:56:02.459736+00:00"} {"global_step": 238590, "acc_step": 0, "speed/wps": 5536.6348503404, "speed/FLOPS": 244690921318883.06, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04763130098581314, "optim/lr": 1.457909513834954e-06, "optim/total_tokens": 2001437982720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.259989857673645, "created_at": "2025-06-03T10:56:05.423241+00:00"} {"global_step": 238591, "acc_step": 0, "speed/wps": 5526.115144927112, "speed/FLOPS": 244226004184349.2, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048319801688194275, "optim/lr": 1.4543622887406293e-06, "optim/total_tokens": 2001446371328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2474374771118164, "created_at": "2025-06-03T10:56:08.394365+00:00"} {"global_step": 238592, "acc_step": 0, "speed/wps": 5527.277633624489, "speed/FLOPS": 244277380234616.7, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048431556671857834, "optim/lr": 1.4508150636460827e-06, "optim/total_tokens": 2001454759936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2525361776351929, "created_at": "2025-06-03T10:56:11.368147+00:00"} {"global_step": 238593, "acc_step": 0, "speed/wps": 5525.834977458236, "speed/FLOPS": 244213622216251.97, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.34 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.34, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04803206026554108, "optim/lr": 1.4472678385515359e-06, "optim/total_tokens": 2001463148544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2491687536239624, "created_at": "2025-06-03T10:56:14.337819+00:00"} {"global_step": 238594, "acc_step": 0, "speed/wps": 5526.717546679659, "speed/FLOPS": 244252627258440.06, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04719332978129387, "optim/lr": 1.4437206134572112e-06, "optim/total_tokens": 2001471537152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.250219702720642, "created_at": "2025-06-03T10:56:17.306992+00:00"} {"global_step": 238595, "acc_step": 0, "speed/wps": 5521.089210017867, "speed/FLOPS": 244003883586427.47, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.52, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048877403140068054, "optim/lr": 1.4401733883626644e-06, "optim/total_tokens": 2001479925760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2546590566635132, "created_at": "2025-06-03T10:56:20.281673+00:00"} {"global_step": 238596, "acc_step": 0, "speed/wps": 5524.352582518455, "speed/FLOPS": 244148107947498.78, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047920797020196915, "optim/lr": 1.4366261632681178e-06, "optim/total_tokens": 2001488314368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2562156915664673, "created_at": "2025-06-03T10:56:23.252094+00:00"} {"global_step": 238597, "acc_step": 0, "speed/wps": 5515.895860067239, "speed/FLOPS": 243774364100584.44, "speed/curr_iter_time": 2.9695, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9695, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04920642077922821, "optim/lr": 1.433078938173571e-06, "optim/total_tokens": 2001496702976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2439919710159302, "created_at": "2025-06-03T10:56:26.226914+00:00"} {"global_step": 238598, "acc_step": 0, "speed/wps": 5521.116369754387, "speed/FLOPS": 244005083907765.5, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.52, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04758751764893532, "optim/lr": 1.4295317130792463e-06, "optim/total_tokens": 2001505091584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2507623434066772, "created_at": "2025-06-03T10:56:29.202939+00:00"} {"global_step": 238599, "acc_step": 0, "speed/wps": 5542.432314377614, "speed/FLOPS": 244947139555216.94, "speed/curr_iter_time": 2.9552, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9552, "speed/est_time_elapsed": "8.16 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 195.86, "speed/est_time_elapsed_days": 8.16, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04704418033361435, "optim/lr": 1.4259844879846995e-06, "optim/total_tokens": 2001513480192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2551233768463135, "created_at": "2025-06-03T10:56:32.168422+00:00"} {"global_step": 238600, "acc_step": 0, "speed/wps": 5530.928473410846, "speed/FLOPS": 244438728666481.66, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048309214413166046, "optim/lr": 1.4224372628901526e-06, "optim/total_tokens": 2001521868800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.264228343963623, "created_at": "2025-06-03T10:56:35.135576+00:00"} {"global_step": 238601, "acc_step": 0, "speed/wps": 5530.144506745145, "speed/FLOPS": 244404081352562.84, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04724716395139694, "optim/lr": 1.418890037795606e-06, "optim/total_tokens": 2001530257408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2550766468048096, "created_at": "2025-06-03T10:56:38.102663+00:00"} {"global_step": 238602, "acc_step": 0, "speed/wps": 5528.958175255569, "speed/FLOPS": 244351651572918.6, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.26, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046631742268800735, "optim/lr": 1.4153428127012813e-06, "optim/total_tokens": 2001538646016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.258544921875, "created_at": "2025-06-03T10:56:41.073669+00:00"} {"global_step": 238603, "acc_step": 0, "speed/wps": 5534.684808031453, "speed/FLOPS": 244604739430048.97, "speed/curr_iter_time": 2.9594, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9594, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.14, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.05147739499807358, "optim/lr": 1.4117955876067345e-06, "optim/total_tokens": 2001547034624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2423237562179565, "created_at": "2025-06-03T10:56:44.043644+00:00"} {"global_step": 238604, "acc_step": 0, "speed/wps": 5517.151569501364, "speed/FLOPS": 243829860030269.25, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.76, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.05784420296549797, "optim/lr": 1.4082483625121877e-06, "optim/total_tokens": 2001555423232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.26542067527771, "created_at": "2025-06-03T10:56:47.018389+00:00"} {"global_step": 238605, "acc_step": 0, "speed/wps": 5519.682113634991, "speed/FLOPS": 243941697128476.5, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.33 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.33, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04677354916930199, "optim/lr": 1.404701137417641e-06, "optim/total_tokens": 2001563811840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.240793228149414, "created_at": "2025-06-03T10:56:49.991495+00:00"} {"global_step": 238606, "acc_step": 0, "speed/wps": 5523.388414102644, "speed/FLOPS": 244105496638581.25, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.55, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04830425977706909, "optim/lr": 1.4011539123233164e-06, "optim/total_tokens": 2001572200448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2465170621871948, "created_at": "2025-06-03T10:56:52.962653+00:00"} {"global_step": 238607, "acc_step": 0, "speed/wps": 5548.5351097012135, "speed/FLOPS": 245216851871581.9, "speed/curr_iter_time": 2.952, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.952, "speed/est_time_elapsed": "8.15 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 195.66, "speed/est_time_elapsed_days": 8.15, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04730795696377754, "optim/lr": 1.3976066872287696e-06, "optim/total_tokens": 2001580589056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.247576117515564, "created_at": "2025-06-03T10:56:55.919765+00:00"} {"global_step": 238608, "acc_step": 0, "speed/wps": 5531.33864279003, "speed/FLOPS": 244456856053604.38, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04734605923295021, "optim/lr": 1.3940594621342228e-06, "optim/total_tokens": 2001588977664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.255759835243225, "created_at": "2025-06-03T10:56:58.886390+00:00"} {"global_step": 238609, "acc_step": 0, "speed/wps": 5526.083600670317, "speed/FLOPS": 244224610089656.97, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048422276973724365, "optim/lr": 1.3905122370396762e-06, "optim/total_tokens": 2001597366272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2611570358276367, "created_at": "2025-06-03T10:57:01.859348+00:00"} {"global_step": 238610, "acc_step": 0, "speed/wps": 5529.485269758012, "speed/FLOPS": 244374946452012.34, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047291625291109085, "optim/lr": 1.3869650119453515e-06, "optim/total_tokens": 2001605754880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2610499858856201, "created_at": "2025-06-03T10:57:04.826664+00:00"} {"global_step": 238611, "acc_step": 0, "speed/wps": 5527.112402989386, "speed/FLOPS": 244270077886272.22, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.049832165241241455, "optim/lr": 1.3834177868508047e-06, "optim/total_tokens": 2001614143488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2587326765060425, "created_at": "2025-06-03T10:57:07.794993+00:00"} {"global_step": 238612, "acc_step": 0, "speed/wps": 5532.478263397642, "speed/FLOPS": 244507221451353.78, "speed/curr_iter_time": 2.9591, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9591, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047210872173309326, "optim/lr": 1.3798705617562579e-06, "optim/total_tokens": 2001622532096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2297091484069824, "created_at": "2025-06-03T10:57:10.760583+00:00"} {"global_step": 238613, "acc_step": 0, "speed/wps": 5514.701080928146, "speed/FLOPS": 243721560978070.6, "speed/curr_iter_time": 2.97, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.97, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.86, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04985015466809273, "optim/lr": 1.3763233366617113e-06, "optim/total_tokens": 2001630920704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2546573877334595, "created_at": "2025-06-03T10:57:13.739786+00:00"} {"global_step": 238614, "acc_step": 0, "speed/wps": 5518.410060906998, "speed/FLOPS": 243885478908855.34, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.73, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046712327748537064, "optim/lr": 1.3727761115673866e-06, "optim/total_tokens": 2001639309312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2422726154327393, "created_at": "2025-06-03T10:57:16.713486+00:00"} {"global_step": 238615, "acc_step": 0, "speed/wps": 5514.186813687258, "speed/FLOPS": 243698832998281.7, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.8, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048468511551618576, "optim/lr": 1.3692288864728398e-06, "optim/total_tokens": 2001647697920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2599049806594849, "created_at": "2025-06-03T10:57:19.693470+00:00"} {"global_step": 238616, "acc_step": 0, "speed/wps": 5538.286987385837, "speed/FLOPS": 244763937319887.4, "speed/curr_iter_time": 2.9574, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9574, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.02, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04807205870747566, "optim/lr": 1.365681661378293e-06, "optim/total_tokens": 2001656086528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2648741006851196, "created_at": "2025-06-03T10:57:22.656007+00:00"} {"global_step": 238617, "acc_step": 0, "speed/wps": 5523.568919656849, "speed/FLOPS": 244113474060165.94, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.55, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047134123742580414, "optim/lr": 1.3621344362837463e-06, "optim/total_tokens": 2001664475136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2550768852233887, "created_at": "2025-06-03T10:57:25.632406+00:00"} {"global_step": 238618, "acc_step": 0, "speed/wps": 5512.6352730117715, "speed/FLOPS": 243630262841930.25, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.32 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.32, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047621071338653564, "optim/lr": 1.3585872111894214e-06, "optim/total_tokens": 2001672863744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.267863154411316, "created_at": "2025-06-03T10:57:28.612455+00:00"} {"global_step": 238619, "acc_step": 0, "speed/wps": 5524.815909753537, "speed/FLOPS": 244168584639765.66, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04739217832684517, "optim/lr": 1.3550399860948748e-06, "optim/total_tokens": 2001681252352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2625871896743774, "created_at": "2025-06-03T10:57:31.582585+00:00"} {"global_step": 238620, "acc_step": 0, "speed/wps": 5535.819861750072, "speed/FLOPS": 244654902994680.34, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.12, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048949744552373886, "optim/lr": 1.351492761000328e-06, "optim/total_tokens": 2001689640960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2613669633865356, "created_at": "2025-06-03T10:57:34.551996+00:00"} {"global_step": 238621, "acc_step": 0, "speed/wps": 5513.416808227515, "speed/FLOPS": 243664802698206.25, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.91, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04713015258312225, "optim/lr": 1.3479455359060033e-06, "optim/total_tokens": 2001698029568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2553143501281738, "created_at": "2025-06-03T10:57:37.530485+00:00"} {"global_step": 238622, "acc_step": 0, "speed/wps": 5507.624132204748, "speed/FLOPS": 243408796067603.66, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 197.04, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047529492527246475, "optim/lr": 1.3443983108114565e-06, "optim/total_tokens": 2001706418176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2558797597885132, "created_at": "2025-06-03T10:57:40.513676+00:00"} {"global_step": 238623, "acc_step": 0, "speed/wps": 5516.206552120093, "speed/FLOPS": 243788095099054.53, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.82, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04757550358772278, "optim/lr": 1.34085108571691e-06, "optim/total_tokens": 2001714806784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2337532043457031, "created_at": "2025-06-03T10:57:43.488698+00:00"} {"global_step": 238624, "acc_step": 0, "speed/wps": 5539.73466247423, "speed/FLOPS": 244827917148921.56, "speed/curr_iter_time": 2.9566, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9566, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 195.98, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048314180225133896, "optim/lr": 1.337303860622363e-06, "optim/total_tokens": 2001723195392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2624696493148804, "created_at": "2025-06-03T10:57:46.450450+00:00"} {"global_step": 238625, "acc_step": 0, "speed/wps": 5523.475978874354, "speed/FLOPS": 244109366553293.72, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046874821186065674, "optim/lr": 1.3337566355280384e-06, "optim/total_tokens": 2001731584000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.26666259765625, "created_at": "2025-06-03T10:57:49.423622+00:00"} {"global_step": 238626, "acc_step": 0, "speed/wps": 5524.762572627335, "speed/FLOPS": 244166227411791.7, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.52, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04925169423222542, "optim/lr": 1.3302094104334916e-06, "optim/total_tokens": 2001739972608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2479629516601562, "created_at": "2025-06-03T10:57:52.394715+00:00"} {"global_step": 238627, "acc_step": 0, "speed/wps": 5527.296066083703, "speed/FLOPS": 244278194854968.1, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04742039740085602, "optim/lr": 1.326662185338945e-06, "optim/total_tokens": 2001748361216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2647074460983276, "created_at": "2025-06-03T10:57:55.363273+00:00"} {"global_step": 238628, "acc_step": 0, "speed/wps": 5536.4971882501095, "speed/FLOPS": 244684837359110.7, "speed/curr_iter_time": 2.9584, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9584, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04707242175936699, "optim/lr": 1.3231149602443982e-06, "optim/total_tokens": 2001756749824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.247788906097412, "created_at": "2025-06-03T10:57:58.329197+00:00"} {"global_step": 238629, "acc_step": 0, "speed/wps": 5521.036785611778, "speed/FLOPS": 244001566696010.78, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04714136943221092, "optim/lr": 1.3195677351500735e-06, "optim/total_tokens": 2001765138432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.245046615600586, "created_at": "2025-06-03T10:58:01.302821+00:00"} {"global_step": 238630, "acc_step": 0, "speed/wps": 5517.451825248635, "speed/FLOPS": 243843129797450.4, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.31 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.31, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046784620732069016, "optim/lr": 1.3160205100555267e-06, "optim/total_tokens": 2001773527040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.243311882019043, "created_at": "2025-06-03T10:58:04.279818+00:00"} {"global_step": 238631, "acc_step": 0, "speed/wps": 5531.424101006416, "speed/FLOPS": 244460632869353.84, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04703879356384277, "optim/lr": 1.31247328496098e-06, "optim/total_tokens": 2001781915648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2510433197021484, "created_at": "2025-06-03T10:58:07.250206+00:00"} {"global_step": 238632, "acc_step": 0, "speed/wps": 5514.662401567211, "speed/FLOPS": 243719851548296.16, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.8, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04846637323498726, "optim/lr": 1.3089260598664332e-06, "optim/total_tokens": 2001790304256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2685184478759766, "created_at": "2025-06-03T10:58:10.225278+00:00"} {"global_step": 238633, "acc_step": 0, "speed/wps": 5539.713139117851, "speed/FLOPS": 244826965926736.1, "speed/curr_iter_time": 2.9567, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9567, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04897778481245041, "optim/lr": 1.3053788347721086e-06, "optim/total_tokens": 2001798692864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.258244514465332, "created_at": "2025-06-03T10:58:13.187683+00:00"} {"global_step": 238634, "acc_step": 0, "speed/wps": 5539.700737522464, "speed/FLOPS": 244826417839697.12, "speed/curr_iter_time": 2.9567, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9567, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 195.99, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047549642622470856, "optim/lr": 1.3018316096775617e-06, "optim/total_tokens": 2001807081472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2623533010482788, "created_at": "2025-06-03T10:58:16.149917+00:00"} {"global_step": 238635, "acc_step": 0, "speed/wps": 5529.073533620526, "speed/FLOPS": 244356749822192.06, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04754720255732536, "optim/lr": 1.298284384583015e-06, "optim/total_tokens": 2001815470080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2400695085525513, "created_at": "2025-06-03T10:58:19.117394+00:00"} {"global_step": 238636, "acc_step": 0, "speed/wps": 5523.796399201261, "speed/FLOPS": 244123527491683.1, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04836700111627579, "optim/lr": 1.2947371594884683e-06, "optim/total_tokens": 2001823858688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2592862844467163, "created_at": "2025-06-03T10:58:22.087849+00:00"} {"global_step": 238637, "acc_step": 0, "speed/wps": 5530.543368045283, "speed/FLOPS": 244421708980471.75, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04819127172231674, "optim/lr": 1.2911899343941436e-06, "optim/total_tokens": 2001832247296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2450453042984009, "created_at": "2025-06-03T10:58:25.058581+00:00"} {"global_step": 238638, "acc_step": 0, "speed/wps": 5522.887946265425, "speed/FLOPS": 244083378521802.78, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04815983772277832, "optim/lr": 1.2876427092995968e-06, "optim/total_tokens": 2001840635904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.259925127029419, "created_at": "2025-06-03T10:58:28.030143+00:00"} {"global_step": 238639, "acc_step": 0, "speed/wps": 5518.395327164604, "speed/FLOPS": 243884827752855.66, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.049485571682453156, "optim/lr": 1.28409548420505e-06, "optim/total_tokens": 2001849024512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2596884965896606, "created_at": "2025-06-03T10:58:31.003288+00:00"} {"global_step": 238640, "acc_step": 0, "speed/wps": 5523.277911177768, "speed/FLOPS": 244100612974907.0, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04729330539703369, "optim/lr": 1.2805482591105034e-06, "optim/total_tokens": 2001857413120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2511224746704102, "created_at": "2025-06-03T10:58:33.974148+00:00"} {"global_step": 238641, "acc_step": 0, "speed/wps": 5528.13174487844, "speed/FLOPS": 244315127580303.66, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.3 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.3, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047377247363328934, "optim/lr": 1.2770010340161787e-06, "optim/total_tokens": 2001865801728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2443593740463257, "created_at": "2025-06-03T10:58:36.942960+00:00"} {"global_step": 238642, "acc_step": 0, "speed/wps": 5536.282846139953, "speed/FLOPS": 244675364534944.16, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.03, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04745880141854286, "optim/lr": 1.2734538089216319e-06, "optim/total_tokens": 2001874190336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2413769960403442, "created_at": "2025-06-03T10:58:39.910369+00:00"} {"global_step": 238643, "acc_step": 0, "speed/wps": 5527.343291355405, "speed/FLOPS": 244280281970256.47, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048329196870326996, "optim/lr": 1.269906583827085e-06, "optim/total_tokens": 2001882578944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2410004138946533, "created_at": "2025-06-03T10:58:42.882995+00:00"} {"global_step": 238644, "acc_step": 0, "speed/wps": 5527.878095479357, "speed/FLOPS": 244303917575159.5, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04749860614538193, "optim/lr": 1.2663593587325385e-06, "optim/total_tokens": 2001890967552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2531646490097046, "created_at": "2025-06-03T10:58:45.851871+00:00"} {"global_step": 238645, "acc_step": 0, "speed/wps": 5529.427275501528, "speed/FLOPS": 244372383402717.28, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.37, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047758348286151886, "optim/lr": 1.2628121336382138e-06, "optim/total_tokens": 2001899356160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.240869164466858, "created_at": "2025-06-03T10:58:48.819127+00:00"} {"global_step": 238646, "acc_step": 0, "speed/wps": 5509.386049975125, "speed/FLOPS": 243486663814741.66, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.98, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04714064672589302, "optim/lr": 1.259264908543667e-06, "optim/total_tokens": 2001907744768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2638109922409058, "created_at": "2025-06-03T10:58:51.798508+00:00"} {"global_step": 238647, "acc_step": 0, "speed/wps": 5513.339007887943, "speed/FLOPS": 243661364321415.4, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04742991924285889, "optim/lr": 1.2557176834491201e-06, "optim/total_tokens": 2001916133376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2461106777191162, "created_at": "2025-06-03T10:58:54.776351+00:00"} {"global_step": 238648, "acc_step": 0, "speed/wps": 5536.127126842432, "speed/FLOPS": 244668482539037.3, "speed/curr_iter_time": 2.9586, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9586, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.13, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04718904569745064, "optim/lr": 1.2521704583547955e-06, "optim/total_tokens": 2001924521984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2486931085586548, "created_at": "2025-06-03T10:58:57.743318+00:00"} {"global_step": 238649, "acc_step": 0, "speed/wps": 5528.865717225825, "speed/FLOPS": 244347565401247.03, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0470108687877655, "optim/lr": 1.2486232332602486e-06, "optim/total_tokens": 2001932910592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.2440941333770752, "created_at": "2025-06-03T10:59:00.711706+00:00"} {"global_step": 238650, "acc_step": 0, "speed/wps": 5522.541065810372, "speed/FLOPS": 244068048181184.56, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.61, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04770737141370773, "optim/lr": 1.245076008165702e-06, "optim/total_tokens": 2001941299200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2713247537612915, "created_at": "2025-06-03T10:59:03.684509+00:00"} {"global_step": 238651, "acc_step": 0, "speed/wps": 5520.073106443752, "speed/FLOPS": 243958977009341.16, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04850462079048157, "optim/lr": 1.2415287830711552e-06, "optim/total_tokens": 2001949687808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.253462314605713, "created_at": "2025-06-03T10:59:06.657448+00:00"} {"global_step": 238652, "acc_step": 0, "speed/wps": 5529.018229279052, "speed/FLOPS": 244354305653372.22, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04767799377441406, "optim/lr": 1.2379815579768305e-06, "optim/total_tokens": 2001958076416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2609624862670898, "created_at": "2025-06-03T10:59:09.628490+00:00"} {"global_step": 238653, "acc_step": 0, "speed/wps": 5525.736199362205, "speed/FLOPS": 244209256729999.53, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.29 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.29, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04720618203282356, "optim/lr": 1.2344343328822837e-06, "optim/total_tokens": 2001966465024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2454270124435425, "created_at": "2025-06-03T10:59:12.598236+00:00"} {"global_step": 238654, "acc_step": 0, "speed/wps": 5527.680309430892, "speed/FLOPS": 244295176444178.1, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.43, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04746196046471596, "optim/lr": 1.2308871077877371e-06, "optim/total_tokens": 2001974853632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2519828081130981, "created_at": "2025-06-03T10:59:15.566844+00:00"} {"global_step": 238655, "acc_step": 0, "speed/wps": 5530.936119394075, "speed/FLOPS": 244439066579804.7, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047309182584285736, "optim/lr": 1.2273398826931903e-06, "optim/total_tokens": 2001983242240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2708367109298706, "created_at": "2025-06-03T10:59:18.535764+00:00"} {"global_step": 238656, "acc_step": 0, "speed/wps": 5524.14803245144, "speed/FLOPS": 244139067881518.84, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047652941197156906, "optim/lr": 1.2237926575988656e-06, "optim/total_tokens": 2001991630848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2608144283294678, "created_at": "2025-06-03T10:59:21.511328+00:00"} {"global_step": 238657, "acc_step": 0, "speed/wps": 5531.097166849504, "speed/FLOPS": 244446184053019.06, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.32, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04777959734201431, "optim/lr": 1.2202454325043188e-06, "optim/total_tokens": 2002000019456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.257479190826416, "created_at": "2025-06-03T10:59:24.478855+00:00"} {"global_step": 238658, "acc_step": 0, "speed/wps": 5531.174922245984, "speed/FLOPS": 244449620443555.28, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.31, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047604821622371674, "optim/lr": 1.2166982074097722e-06, "optim/total_tokens": 2002008408064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2502632141113281, "created_at": "2025-06-03T10:59:27.450009+00:00"} {"global_step": 238659, "acc_step": 0, "speed/wps": 5529.808397920367, "speed/FLOPS": 244389227062868.56, "speed/curr_iter_time": 2.9606, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9606, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048616569489240646, "optim/lr": 1.2131509823152254e-06, "optim/total_tokens": 2002016796672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2472293376922607, "created_at": "2025-06-03T10:59:30.421972+00:00"} {"global_step": 238660, "acc_step": 0, "speed/wps": 5519.90437422682, "speed/FLOPS": 243951519909002.53, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04704924672842026, "optim/lr": 1.2096037572209007e-06, "optim/total_tokens": 2002025185280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2610961198806763, "created_at": "2025-06-03T10:59:33.394562+00:00"} {"global_step": 238661, "acc_step": 0, "speed/wps": 5523.126728728773, "speed/FLOPS": 244093931484483.3, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.6, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047521576285362244, "optim/lr": 1.2060565321263539e-06, "optim/total_tokens": 2002033573888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.251218318939209, "created_at": "2025-06-03T10:59:36.368908+00:00"} {"global_step": 238662, "acc_step": 0, "speed/wps": 5521.167791095581, "speed/FLOPS": 244007356467848.0, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046859510242938995, "optim/lr": 1.2025093070318073e-06, "optim/total_tokens": 2002041962496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2386021614074707, "created_at": "2025-06-03T10:59:39.344665+00:00"} {"global_step": 238663, "acc_step": 0, "speed/wps": 5527.25310409154, "speed/FLOPS": 244276296154813.9, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04738011956214905, "optim/lr": 1.1989620819372604e-06, "optim/total_tokens": 2002050351104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2449008226394653, "created_at": "2025-06-03T10:59:42.316560+00:00"} {"global_step": 238664, "acc_step": 0, "speed/wps": 5513.119479398223, "speed/FLOPS": 243651662285818.47, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.96, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04808586463332176, "optim/lr": 1.1954148568429358e-06, "optim/total_tokens": 2002058739712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2422853708267212, "created_at": "2025-06-03T10:59:45.295050+00:00"} {"global_step": 238665, "acc_step": 0, "speed/wps": 5522.307352432389, "speed/FLOPS": 244057719246131.25, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.28 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.28, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0475703664124012, "optim/lr": 1.191867631748389e-06, "optim/total_tokens": 2002067128320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2526609897613525, "created_at": "2025-06-03T10:59:48.266750+00:00"} {"global_step": 238666, "acc_step": 0, "speed/wps": 5532.510244775879, "speed/FLOPS": 244508634864576.34, "speed/curr_iter_time": 2.9593, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9593, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.19, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047072116285562515, "optim/lr": 1.1883204066538421e-06, "optim/total_tokens": 2002075516928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2509781122207642, "created_at": "2025-06-03T10:59:51.239550+00:00"} {"global_step": 238667, "acc_step": 0, "speed/wps": 5520.540437687883, "speed/FLOPS": 243979630658313.6, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04697861149907112, "optim/lr": 1.1847731815592955e-06, "optim/total_tokens": 2002083905536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2590638399124146, "created_at": "2025-06-03T10:59:54.215663+00:00"} {"global_step": 238668, "acc_step": 0, "speed/wps": 5521.616172113553, "speed/FLOPS": 244027172613820.28, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04741499572992325, "optim/lr": 1.1812259564649708e-06, "optim/total_tokens": 2002092294144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2488300800323486, "created_at": "2025-06-03T10:59:57.188823+00:00"} {"global_step": 238669, "acc_step": 0, "speed/wps": 5530.821186254208, "speed/FLOPS": 244433987123303.72, "speed/curr_iter_time": 2.9602, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9602, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04718455672264099, "optim/lr": 1.177678731370424e-06, "optim/total_tokens": 2002100682752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2510156631469727, "created_at": "2025-06-03T11:00:00.159854+00:00"} {"global_step": 238670, "acc_step": 0, "speed/wps": 5522.833365064593, "speed/FLOPS": 244080966312097.9, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047187309712171555, "optim/lr": 1.1741315062758772e-06, "optim/total_tokens": 2002109071360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2564897537231445, "created_at": "2025-06-03T11:00:03.131138+00:00"} {"global_step": 238671, "acc_step": 0, "speed/wps": 5521.286742572372, "speed/FLOPS": 244012613514273.28, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0476849302649498, "optim/lr": 1.1705842811813306e-06, "optim/total_tokens": 2002117459968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2465076446533203, "created_at": "2025-06-03T11:00:06.107802+00:00"} {"global_step": 238672, "acc_step": 0, "speed/wps": 5524.445005464241, "speed/FLOPS": 244152192568639.0, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04731171578168869, "optim/lr": 1.167037056087006e-06, "optim/total_tokens": 2002125848576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2521125078201294, "created_at": "2025-06-03T11:00:09.080661+00:00"} {"global_step": 238673, "acc_step": 0, "speed/wps": 5529.362454591605, "speed/FLOPS": 244369518650282.16, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0480937585234642, "optim/lr": 1.163489830992459e-06, "optim/total_tokens": 2002134237184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2427572011947632, "created_at": "2025-06-03T11:00:12.052002+00:00"} {"global_step": 238674, "acc_step": 0, "speed/wps": 5532.617801483415, "speed/FLOPS": 244513388320524.28, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.28, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04761091619729996, "optim/lr": 1.1599426058979123e-06, "optim/total_tokens": 2002142625792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.248929738998413, "created_at": "2025-06-03T11:00:15.021957+00:00"} {"global_step": 238675, "acc_step": 0, "speed/wps": 5521.821582862317, "speed/FLOPS": 244036250717528.1, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047468218952417374, "optim/lr": 1.1563953808035876e-06, "optim/total_tokens": 2002151014400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2591021060943604, "created_at": "2025-06-03T11:00:17.997092+00:00"} {"global_step": 238676, "acc_step": 0, "speed/wps": 5526.807572786836, "speed/FLOPS": 244256605951581.94, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04717239737510681, "optim/lr": 1.152848155709041e-06, "optim/total_tokens": 2002159403008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2409127950668335, "created_at": "2025-06-03T11:00:20.965822+00:00"} {"global_step": 238677, "acc_step": 0, "speed/wps": 5527.452575449501, "speed/FLOPS": 244285111767848.78, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.27 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.27, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047591179609298706, "optim/lr": 1.1493009306144942e-06, "optim/total_tokens": 2002167791616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2458300590515137, "created_at": "2025-06-03T11:00:23.938654+00:00"} {"global_step": 238678, "acc_step": 0, "speed/wps": 5532.889748092207, "speed/FLOPS": 244525406968683.97, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04755554348230362, "optim/lr": 1.1457537055199474e-06, "optim/total_tokens": 2002176180224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 423, "loss/out": 1.2584998607635498, "created_at": "2025-06-03T11:00:26.904274+00:00"} {"global_step": 238679, "acc_step": 0, "speed/wps": 5525.999910409198, "speed/FLOPS": 244220911408481.1, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04766048118472099, "optim/lr": 1.1422064804256227e-06, "optim/total_tokens": 2002184568832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2770662307739258, "created_at": "2025-06-03T11:00:29.876249+00:00"} {"global_step": 238680, "acc_step": 0, "speed/wps": 5513.981108154119, "speed/FLOPS": 243689741866613.3, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04713594540953636, "optim/lr": 1.1386592553310759e-06, "optim/total_tokens": 2002192957440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2436672449111938, "created_at": "2025-06-03T11:00:32.852833+00:00"} {"global_step": 238681, "acc_step": 0, "speed/wps": 5526.289673785425, "speed/FLOPS": 244233717466566.97, "speed/curr_iter_time": 2.9639, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9639, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04739224910736084, "optim/lr": 1.1351120302365292e-06, "optim/total_tokens": 2002201346048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2610291242599487, "created_at": "2025-06-03T11:00:35.826800+00:00"} {"global_step": 238682, "acc_step": 0, "speed/wps": 5518.641913276912, "speed/FLOPS": 243895725596877.53, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04865814745426178, "optim/lr": 1.1315648051419824e-06, "optim/total_tokens": 2002209734656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2361960411071777, "created_at": "2025-06-03T11:00:38.805281+00:00"} {"global_step": 238683, "acc_step": 0, "speed/wps": 5536.213419090025, "speed/FLOPS": 244672296214697.2, "speed/curr_iter_time": 2.9572, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9572, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.06, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047277458012104034, "optim/lr": 1.1280175800476577e-06, "optim/total_tokens": 2002218123264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2441821098327637, "created_at": "2025-06-03T11:00:41.769124+00:00"} {"global_step": 238684, "acc_step": 0, "speed/wps": 5533.695467631896, "speed/FLOPS": 244561015648291.75, "speed/curr_iter_time": 2.9599, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9599, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0477253794670105, "optim/lr": 1.124470354953111e-06, "optim/total_tokens": 2002226511872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2427775859832764, "created_at": "2025-06-03T11:00:44.734566+00:00"} {"global_step": 238685, "acc_step": 0, "speed/wps": 5522.287968615306, "speed/FLOPS": 244056862580631.56, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04674021899700165, "optim/lr": 1.1209231298585643e-06, "optim/total_tokens": 2002234900480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2445566654205322, "created_at": "2025-06-03T11:00:47.707069+00:00"} {"global_step": 238686, "acc_step": 0, "speed/wps": 5525.173417490583, "speed/FLOPS": 244184384651852.6, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04766249284148216, "optim/lr": 1.1173759047640175e-06, "optim/total_tokens": 2002243289088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2573546171188354, "created_at": "2025-06-03T11:00:50.677229+00:00"} {"global_step": 238687, "acc_step": 0, "speed/wps": 5529.647035300868, "speed/FLOPS": 244382095661015.47, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.39, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.05132071673870087, "optim/lr": 1.1138286796696928e-06, "optim/total_tokens": 2002251677696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2480852603912354, "created_at": "2025-06-03T11:00:53.651230+00:00"} {"global_step": 238688, "acc_step": 0, "speed/wps": 5525.42828649012, "speed/FLOPS": 244195648557094.3, "speed/curr_iter_time": 2.9643, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9643, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048611681908369064, "optim/lr": 1.110281454575146e-06, "optim/total_tokens": 2002260066304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2514582872390747, "created_at": "2025-06-03T11:00:56.622813+00:00"} {"global_step": 238689, "acc_step": 0, "speed/wps": 5515.482359052109, "speed/FLOPS": 243756089472205.78, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04709245637059212, "optim/lr": 1.1067342294805994e-06, "optim/total_tokens": 2002268454912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2628675699234009, "created_at": "2025-06-03T11:00:59.602166+00:00"} {"global_step": 238690, "acc_step": 0, "speed/wps": 5522.035776877471, "speed/FLOPS": 244045716996653.56, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.26 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.26, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04704916477203369, "optim/lr": 1.1031870043860526e-06, "optim/total_tokens": 2002276843520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2522690296173096, "created_at": "2025-06-03T11:01:02.574216+00:00"} {"global_step": 238691, "acc_step": 0, "speed/wps": 5520.674760674445, "speed/FLOPS": 243985567046792.25, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.71, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047508493065834045, "optim/lr": 1.099639779291728e-06, "optim/total_tokens": 2002285232128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2595622539520264, "created_at": "2025-06-03T11:01:05.546622+00:00"} {"global_step": 238692, "acc_step": 0, "speed/wps": 5532.625476497667, "speed/FLOPS": 244513727516869.94, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04721933230757713, "optim/lr": 1.096092554197181e-06, "optim/total_tokens": 2002293620736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2485898733139038, "created_at": "2025-06-03T11:01:08.513446+00:00"} {"global_step": 238693, "acc_step": 0, "speed/wps": 5516.139333087059, "speed/FLOPS": 243785124361852.6, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048997413367033005, "optim/lr": 1.0925453291026345e-06, "optim/total_tokens": 2002302009344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2688318490982056, "created_at": "2025-06-03T11:01:11.488452+00:00"} {"global_step": 238694, "acc_step": 0, "speed/wps": 5537.682570038769, "speed/FLOPS": 244737225166835.4, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.11, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04754563421010971, "optim/lr": 1.0889981040080877e-06, "optim/total_tokens": 2002310397952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 421, "loss/out": 1.2561010122299194, "created_at": "2025-06-03T11:01:14.451999+00:00"} {"global_step": 238695, "acc_step": 0, "speed/wps": 5522.769897569945, "speed/FLOPS": 244078161373690.56, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.64, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04847925156354904, "optim/lr": 1.085450878913763e-06, "optim/total_tokens": 2002318786560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 393, "loss/out": 1.2550073862075806, "created_at": "2025-06-03T11:01:17.426039+00:00"} {"global_step": 238696, "acc_step": 0, "speed/wps": 5517.322674930396, "speed/FLOPS": 243837422014435.47, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04865596070885658, "optim/lr": 1.0819036538192162e-06, "optim/total_tokens": 2002327175168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2577022314071655, "created_at": "2025-06-03T11:01:20.400149+00:00"} {"global_step": 238697, "acc_step": 0, "speed/wps": 5511.998888691009, "speed/FLOPS": 243602137912262.78, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 197.02, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04782385006546974, "optim/lr": 1.0783564287246693e-06, "optim/total_tokens": 2002335563776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2556865215301514, "created_at": "2025-06-03T11:01:23.381409+00:00"} {"global_step": 238698, "acc_step": 0, "speed/wps": 5509.660028792765, "speed/FLOPS": 243498772276130.6, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 197.11, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0480060800909996, "optim/lr": 1.0748092036301227e-06, "optim/total_tokens": 2002343952384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2481781244277954, "created_at": "2025-06-03T11:01:26.360382+00:00"} {"global_step": 238699, "acc_step": 0, "speed/wps": 5518.738865057077, "speed/FLOPS": 243900010369316.62, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04869728535413742, "optim/lr": 1.071261978535798e-06, "optim/total_tokens": 2002352340992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2740533351898193, "created_at": "2025-06-03T11:01:29.336659+00:00"} {"global_step": 238700, "acc_step": 0, "speed/wps": 5524.798326658161, "speed/FLOPS": 244167807556948.47, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04828198254108429, "optim/lr": 1.0677147534412512e-06, "optim/total_tokens": 2002360729600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2444959878921509, "created_at": "2025-06-03T11:01:32.306822+00:00"} {"global_step": 238701, "acc_step": 0, "speed/wps": 5533.263729483404, "speed/FLOPS": 244541935031964.6, "speed/curr_iter_time": 2.9601, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9601, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.27, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04732540622353554, "optim/lr": 1.0641675283467044e-06, "optim/total_tokens": 2002369118208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2622710466384888, "created_at": "2025-06-03T11:01:35.274164+00:00"} {"global_step": 238702, "acc_step": 0, "speed/wps": 5527.883651678978, "speed/FLOPS": 244304163130743.53, "speed/curr_iter_time": 2.963, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.963, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.25 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.25, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047024525701999664, "optim/lr": 1.0606203032523797e-06, "optim/total_tokens": 2002377506816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2533776760101318, "created_at": "2025-06-03T11:01:38.247084+00:00"} {"global_step": 238703, "acc_step": 0, "speed/wps": 5517.799599582706, "speed/FLOPS": 243858499642945.94, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047579701989889145, "optim/lr": 1.0570730781578331e-06, "optim/total_tokens": 2002385895424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2511898279190063, "created_at": "2025-06-03T11:01:41.220661+00:00"} {"global_step": 238704, "acc_step": 0, "speed/wps": 5509.35374358113, "speed/FLOPS": 243485236037486.2, "speed/curr_iter_time": 2.9729, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9729, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 197.12, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.052028220146894455, "optim/lr": 1.0535258530632863e-06, "optim/total_tokens": 2002394284032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2536205053329468, "created_at": "2025-06-03T11:01:44.199184+00:00"} {"global_step": 238705, "acc_step": 0, "speed/wps": 5511.968710834646, "speed/FLOPS": 243600804205475.8, "speed/curr_iter_time": 2.9715, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9715, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 197.03, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04754041135311127, "optim/lr": 1.0499786279687395e-06, "optim/total_tokens": 2002402672640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.251286506652832, "created_at": "2025-06-03T11:01:47.177381+00:00"} {"global_step": 238706, "acc_step": 0, "speed/wps": 5508.525004936017, "speed/FLOPS": 243448610031241.06, "speed/curr_iter_time": 2.972, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.972, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 197.07, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04848838970065117, "optim/lr": 1.0464314028744148e-06, "optim/total_tokens": 2002411061248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2462286949157715, "created_at": "2025-06-03T11:01:50.156105+00:00"} {"global_step": 238707, "acc_step": 0, "speed/wps": 5517.260612303568, "speed/FLOPS": 243834679163995.03, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.85, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04820597916841507, "optim/lr": 1.0428841777798682e-06, "optim/total_tokens": 2002419449856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2524785995483398, "created_at": "2025-06-03T11:01:53.133111+00:00"} {"global_step": 238708, "acc_step": 0, "speed/wps": 5525.028905466858, "speed/FLOPS": 244177997960083.53, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048143334686756134, "optim/lr": 1.0393369526853214e-06, "optim/total_tokens": 2002427838464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2543538808822632, "created_at": "2025-06-03T11:01:56.103054+00:00"} {"global_step": 238709, "acc_step": 0, "speed/wps": 5520.991358689189, "speed/FLOPS": 243999559058548.38, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04726898670196533, "optim/lr": 1.0357897275907746e-06, "optim/total_tokens": 2002436227072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.244489312171936, "created_at": "2025-06-03T11:01:59.075219+00:00"} {"global_step": 238710, "acc_step": 0, "speed/wps": 5532.519812075398, "speed/FLOPS": 244509057690245.2, "speed/curr_iter_time": 2.959, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.959, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04762660339474678, "optim/lr": 1.0322425024964499e-06, "optim/total_tokens": 2002444615680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.267350435256958, "created_at": "2025-06-03T11:02:02.044492+00:00"} {"global_step": 238711, "acc_step": 0, "speed/wps": 5522.634878821329, "speed/FLOPS": 244072194236090.34, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04902602359652519, "optim/lr": 1.028695277401903e-06, "optim/total_tokens": 2002453004288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.269655704498291, "created_at": "2025-06-03T11:02:05.016456+00:00"} {"global_step": 238712, "acc_step": 0, "speed/wps": 5521.437552667305, "speed/FLOPS": 244019278548553.28, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.71, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04724715277552605, "optim/lr": 1.0251480523073565e-06, "optim/total_tokens": 2002461392896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2659300565719604, "created_at": "2025-06-03T11:02:07.993508+00:00"} {"global_step": 238713, "acc_step": 0, "speed/wps": 5513.652282268473, "speed/FLOPS": 243675209445551.2, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.89, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.5873607993125916, "optim/lr": 1.0216008272128096e-06, "optim/total_tokens": 2002469781504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2536565065383911, "created_at": "2025-06-03T11:02:10.969390+00:00"} {"global_step": 238714, "acc_step": 0, "speed/wps": 5513.527039609864, "speed/FLOPS": 243669674361090.72, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 196.99, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04798487573862076, "optim/lr": 1.018053602118485e-06, "optim/total_tokens": 2002478170112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2421891689300537, "created_at": "2025-06-03T11:02:13.948999+00:00"} {"global_step": 238715, "acc_step": 0, "speed/wps": 5510.980776657428, "speed/FLOPS": 243557142571548.28, "speed/curr_iter_time": 2.9721, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9721, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.24 hours", "speed/est_time_elapsed_hrs": 197.08, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.24, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04740402474999428, "optim/lr": 1.0145063770239381e-06, "optim/total_tokens": 2002486558720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2593424320220947, "created_at": "2025-06-03T11:02:16.930224+00:00"} {"global_step": 238716, "acc_step": 0, "speed/wps": 5520.268403197425, "speed/FLOPS": 243967608126234.1, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04816337674856186, "optim/lr": 1.0109591519293915e-06, "optim/total_tokens": 2002494947328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2579699754714966, "created_at": "2025-06-03T11:02:19.906587+00:00"} {"global_step": 238717, "acc_step": 0, "speed/wps": 5528.2088644929945, "speed/FLOPS": 244318535872532.97, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04852655529975891, "optim/lr": 1.0074119268348447e-06, "optim/total_tokens": 2002503335936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2519657611846924, "created_at": "2025-06-03T11:02:22.878690+00:00"} {"global_step": 238718, "acc_step": 0, "speed/wps": 5520.658281081702, "speed/FLOPS": 243984838733143.2, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04755857586860657, "optim/lr": 1.00386470174052e-06, "optim/total_tokens": 2002511724544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2584608793258667, "created_at": "2025-06-03T11:02:25.851229+00:00"} {"global_step": 238719, "acc_step": 0, "speed/wps": 5522.297005683368, "speed/FLOPS": 244057261972783.97, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.68, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04720166325569153, "optim/lr": 1.0003174766459732e-06, "optim/total_tokens": 2002520113152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2377302646636963, "created_at": "2025-06-03T11:02:28.822530+00:00"} {"global_step": 238720, "acc_step": 0, "speed/wps": 5520.818695468823, "speed/FLOPS": 243991928227978.7, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04769959673285484, "optim/lr": 9.967702515514266e-07, "optim/total_tokens": 2002528501760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2629183530807495, "created_at": "2025-06-03T11:02:31.798016+00:00"} {"global_step": 238721, "acc_step": 0, "speed/wps": 5528.233469826864, "speed/FLOPS": 244319623302348.5, "speed/curr_iter_time": 2.9628, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9628, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0476657934486866, "optim/lr": 9.932230264568798e-07, "optim/total_tokens": 2002536890368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2433431148529053, "created_at": "2025-06-03T11:02:34.766081+00:00"} {"global_step": 238722, "acc_step": 0, "speed/wps": 5522.215702603946, "speed/FLOPS": 244053668792820.4, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.68, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047545239329338074, "optim/lr": 9.896758013625551e-07, "optim/total_tokens": 2002545278976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.24728262424469, "created_at": "2025-06-03T11:02:37.740657+00:00"} {"global_step": 238723, "acc_step": 0, "speed/wps": 5512.854338392923, "speed/FLOPS": 243639944410498.88, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.92, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047906793653964996, "optim/lr": 9.861285762680083e-07, "optim/total_tokens": 2002553667584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2513198852539062, "created_at": "2025-06-03T11:02:40.717130+00:00"} {"global_step": 238724, "acc_step": 0, "speed/wps": 5507.728349466033, "speed/FLOPS": 243413401937120.16, "speed/curr_iter_time": 2.9738, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9738, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 197.2, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04881521686911583, "optim/lr": 9.825813511734617e-07, "optim/total_tokens": 2002562056192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.2589898109436035, "created_at": "2025-06-03T11:02:43.699445+00:00"} {"global_step": 238725, "acc_step": 0, "speed/wps": 5532.04253661326, "speed/FLOPS": 244487964557736.0, "speed/curr_iter_time": 2.9607, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9607, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.33, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04768824577331543, "optim/lr": 9.790341260789149e-07, "optim/total_tokens": 2002570444800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2563183307647705, "created_at": "2025-06-03T11:02:46.665574+00:00"} {"global_step": 238726, "acc_step": 0, "speed/wps": 5519.021219171094, "speed/FLOPS": 243912488975936.8, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.71, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04753788933157921, "optim/lr": 9.754869009845902e-07, "optim/total_tokens": 2002578833408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2540817260742188, "created_at": "2025-06-03T11:02:49.640844+00:00"} {"global_step": 238727, "acc_step": 0, "speed/wps": 5517.271880622736, "speed/FLOPS": 243835177166025.75, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.23 hours", "speed/est_time_elapsed_hrs": 196.86, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.23, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04850669205188751, "optim/lr": 9.719396758900434e-07, "optim/total_tokens": 2002587222016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2702627182006836, "created_at": "2025-06-03T11:02:52.616145+00:00"} {"global_step": 238728, "acc_step": 0, "speed/wps": 5513.260144978029, "speed/FLOPS": 243657878984454.16, "speed/curr_iter_time": 2.9708, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9708, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 197.0, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047501690685749054, "optim/lr": 9.683924507954965e-07, "optim/total_tokens": 2002595610624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2587130069732666, "created_at": "2025-06-03T11:02:55.596296+00:00"} {"global_step": 238729, "acc_step": 0, "speed/wps": 5526.810257567446, "speed/FLOPS": 244256724605142.9, "speed/curr_iter_time": 2.9636, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9636, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04801321402192116, "optim/lr": 9.648452257011719e-07, "optim/total_tokens": 2002603999232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.259885549545288, "created_at": "2025-06-03T11:02:58.565281+00:00"} {"global_step": 238730, "acc_step": 0, "speed/wps": 5511.287861353049, "speed/FLOPS": 243570714143292.8, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.98, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04755483940243721, "optim/lr": 9.612980006066253e-07, "optim/total_tokens": 2002612387840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2607828378677368, "created_at": "2025-06-03T11:03:01.545493+00:00"} {"global_step": 238731, "acc_step": 0, "speed/wps": 5519.664163581655, "speed/FLOPS": 243940903827995.78, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04747450724244118, "optim/lr": 9.577507755120784e-07, "optim/total_tokens": 2002620776448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2634073495864868, "created_at": "2025-06-03T11:03:04.518213+00:00"} {"global_step": 238732, "acc_step": 0, "speed/wps": 5512.622808818945, "speed/FLOPS": 243629711988404.84, "speed/curr_iter_time": 2.9712, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9712, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 197.03, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04746140167117119, "optim/lr": 9.542035504175316e-07, "optim/total_tokens": 2002629165056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2516416311264038, "created_at": "2025-06-03T11:03:07.498123+00:00"} {"global_step": 238733, "acc_step": 0, "speed/wps": 5533.565832503656, "speed/FLOPS": 244555286439156.28, "speed/curr_iter_time": 2.9587, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9587, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04835744574666023, "optim/lr": 9.50656325323207e-07, "optim/total_tokens": 2002637553664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.237302541732788, "created_at": "2025-06-03T11:03:10.467785+00:00"} {"global_step": 238734, "acc_step": 0, "speed/wps": 5517.448151953269, "speed/FLOPS": 243842967456596.84, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.86, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04728811979293823, "optim/lr": 9.471091002286602e-07, "optim/total_tokens": 2002645942272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 376, "loss/out": 1.256891131401062, "created_at": "2025-06-03T11:03:13.442877+00:00"} {"global_step": 238735, "acc_step": 0, "speed/wps": 5527.279115823066, "speed/FLOPS": 244277445740207.22, "speed/curr_iter_time": 2.9633, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9633, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048909761011600494, "optim/lr": 9.435618751341135e-07, "optim/total_tokens": 2002654330880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2654948234558105, "created_at": "2025-06-03T11:03:16.415016+00:00"} {"global_step": 238736, "acc_step": 0, "speed/wps": 5525.039007380363, "speed/FLOPS": 244178444412954.16, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04780801385641098, "optim/lr": 9.400146500395668e-07, "optim/total_tokens": 2002662719488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.267264723777771, "created_at": "2025-06-03T11:03:19.385090+00:00"} {"global_step": 238737, "acc_step": 0, "speed/wps": 5525.711348098717, "speed/FLOPS": 244208158431353.66, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047397028654813766, "optim/lr": 9.36467424945242e-07, "optim/total_tokens": 2002671108096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2594020366668701, "created_at": "2025-06-03T11:03:22.359301+00:00"} {"global_step": 238738, "acc_step": 0, "speed/wps": 5528.429866938474, "speed/FLOPS": 244328303049430.12, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04742851108312607, "optim/lr": 9.329201998506953e-07, "optim/total_tokens": 2002679496704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.25077223777771, "created_at": "2025-06-03T11:03:25.331340+00:00"} {"global_step": 238739, "acc_step": 0, "speed/wps": 5515.194129437896, "speed/FLOPS": 243743351198550.44, "speed/curr_iter_time": 2.9698, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9698, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.22 hours", "speed/est_time_elapsed_hrs": 196.95, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.22, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048075370490550995, "optim/lr": 9.293729747561486e-07, "optim/total_tokens": 2002687885312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2538697719573975, "created_at": "2025-06-03T11:03:28.306705+00:00"} {"global_step": 238740, "acc_step": 0, "speed/wps": 5517.816798081202, "speed/FLOPS": 243859259728549.56, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.75, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047496117651462555, "optim/lr": 9.258257496616018e-07, "optim/total_tokens": 2002696273920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.248241901397705, "created_at": "2025-06-03T11:03:31.280985+00:00"} {"global_step": 238741, "acc_step": 0, "speed/wps": 5506.810055596208, "speed/FLOPS": 243372818048328.0, "speed/curr_iter_time": 2.9744, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9744, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 197.25, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04713550582528114, "optim/lr": 9.222785245672771e-07, "optim/total_tokens": 2002704662528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.251110553741455, "created_at": "2025-06-03T11:03:34.264797+00:00"} {"global_step": 238742, "acc_step": 0, "speed/wps": 5530.0431873285725, "speed/FLOPS": 244399603552950.12, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04751570522785187, "optim/lr": 9.187312994727304e-07, "optim/total_tokens": 2002713051136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2507938146591187, "created_at": "2025-06-03T11:03:37.232515+00:00"} {"global_step": 238743, "acc_step": 0, "speed/wps": 5518.505934285475, "speed/FLOPS": 243889716021459.56, "speed/curr_iter_time": 2.9666, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9666, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047872643917798996, "optim/lr": 9.151840743781837e-07, "optim/total_tokens": 2002721439744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2470190525054932, "created_at": "2025-06-03T11:03:40.206942+00:00"} {"global_step": 238744, "acc_step": 0, "speed/wps": 5513.032291922049, "speed/FLOPS": 243647809045637.53, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 197.02, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0477626733481884, "optim/lr": 9.116368492836369e-07, "optim/total_tokens": 2002729828352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2569464445114136, "created_at": "2025-06-03T11:03:43.183264+00:00"} {"global_step": 238745, "acc_step": 0, "speed/wps": 5528.685941700685, "speed/FLOPS": 244339620243210.4, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0481310673058033, "optim/lr": 9.080896241893122e-07, "optim/total_tokens": 2002738216960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 395, "loss/out": 1.2564187049865723, "created_at": "2025-06-03T11:03:46.151312+00:00"} {"global_step": 238746, "acc_step": 0, "speed/wps": 5524.10860770326, "speed/FLOPS": 244137325509443.47, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.05274093151092529, "optim/lr": 9.045423990947655e-07, "optim/total_tokens": 2002746605568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2636958360671997, "created_at": "2025-06-03T11:03:49.121436+00:00"} {"global_step": 238747, "acc_step": 0, "speed/wps": 5520.489457654159, "speed/FLOPS": 243977377601762.47, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04777472838759422, "optim/lr": 9.009951740002186e-07, "optim/total_tokens": 2002754994176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2644296884536743, "created_at": "2025-06-03T11:03:52.097279+00:00"} {"global_step": 238748, "acc_step": 0, "speed/wps": 5521.862999362566, "speed/FLOPS": 244038081114850.25, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04684779420495033, "optim/lr": 8.974479489056719e-07, "optim/total_tokens": 2002763382784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.228014588356018, "created_at": "2025-06-03T11:03:55.072430+00:00"} {"global_step": 238749, "acc_step": 0, "speed/wps": 5530.328103240434, "speed/FLOPS": 244412195377922.56, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04756937175989151, "optim/lr": 8.939007238113472e-07, "optim/total_tokens": 2002771771392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2494142055511475, "created_at": "2025-06-03T11:03:58.043842+00:00"} {"global_step": 238750, "acc_step": 0, "speed/wps": 5527.127062194537, "speed/FLOPS": 244270725748107.25, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.21 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.21, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04766015708446503, "optim/lr": 8.903534987168005e-07, "optim/total_tokens": 2002780160000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2497869729995728, "created_at": "2025-06-03T11:04:01.012587+00:00"} {"global_step": 238751, "acc_step": 0, "speed/wps": 5527.63304843971, "speed/FLOPS": 244293087750271.56, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04724837467074394, "optim/lr": 8.868062736222537e-07, "optim/total_tokens": 2002788548608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.261983036994934, "created_at": "2025-06-03T11:04:03.985069+00:00"} {"global_step": 238752, "acc_step": 0, "speed/wps": 5524.680241392249, "speed/FLOPS": 244162588792610.3, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04719199240207672, "optim/lr": 8.83259048527707e-07, "optim/total_tokens": 2002796937216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.250105381011963, "created_at": "2025-06-03T11:04:06.956715+00:00"} {"global_step": 238753, "acc_step": 0, "speed/wps": 5516.388217145655, "speed/FLOPS": 243796123763338.47, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.83, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04739557206630707, "optim/lr": 8.797118234333823e-07, "optim/total_tokens": 2002805325824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2473502159118652, "created_at": "2025-06-03T11:04:09.931061+00:00"} {"global_step": 238754, "acc_step": 0, "speed/wps": 5524.977603915877, "speed/FLOPS": 244175730694115.3, "speed/curr_iter_time": 2.9645, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9645, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.61, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04734477028250694, "optim/lr": 8.761645983388355e-07, "optim/total_tokens": 2002813714432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2665653228759766, "created_at": "2025-06-03T11:04:12.901082+00:00"} {"global_step": 238755, "acc_step": 0, "speed/wps": 5514.469867680226, "speed/FLOPS": 243711342535969.2, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.99, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04752027243375778, "optim/lr": 8.726173732442888e-07, "optim/total_tokens": 2002822103040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2512705326080322, "created_at": "2025-06-03T11:04:15.876487+00:00"} {"global_step": 238756, "acc_step": 0, "speed/wps": 5505.756426127388, "speed/FLOPS": 243326253018770.66, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 197.3, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04716748744249344, "optim/lr": 8.690701481499641e-07, "optim/total_tokens": 2002830491648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.262807011604309, "created_at": "2025-06-03T11:04:18.860750+00:00"} {"global_step": 238757, "acc_step": 0, "speed/wps": 5515.517327314314, "speed/FLOPS": 243757634890411.44, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.85, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0478789396584034, "optim/lr": 8.655229230554174e-07, "optim/total_tokens": 2002838880256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2537906169891357, "created_at": "2025-06-03T11:04:21.842507+00:00"} {"global_step": 238758, "acc_step": 0, "speed/wps": 5515.923545948049, "speed/FLOPS": 243775587674807.06, "speed/curr_iter_time": 2.9694, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9694, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04864020273089409, "optim/lr": 8.619756979608706e-07, "optim/total_tokens": 2002847268864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2534244060516357, "created_at": "2025-06-03T11:04:24.817630+00:00"} {"global_step": 238759, "acc_step": 0, "speed/wps": 5521.469749654227, "speed/FLOPS": 244020701490576.12, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04720531404018402, "optim/lr": 8.584284728663239e-07, "optim/total_tokens": 2002855657472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.261590600013733, "created_at": "2025-06-03T11:04:27.789142+00:00"} {"global_step": 238760, "acc_step": 0, "speed/wps": 5526.859803415439, "speed/FLOPS": 244258914278025.6, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047075025737285614, "optim/lr": 8.548812477719992e-07, "optim/total_tokens": 2002864046080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.250430703163147, "created_at": "2025-06-03T11:04:30.758221+00:00"} {"global_step": 238761, "acc_step": 0, "speed/wps": 5524.763740737713, "speed/FLOPS": 244166279036291.47, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04696349427103996, "optim/lr": 8.513340226774524e-07, "optim/total_tokens": 2002872434688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.25130033493042, "created_at": "2025-06-03T11:04:33.728427+00:00"} {"global_step": 238762, "acc_step": 0, "speed/wps": 5536.262434155673, "speed/FLOPS": 244674462429716.97, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.22, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047605566680431366, "optim/lr": 8.477867975829057e-07, "optim/total_tokens": 2002880823296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2729195356369019, "created_at": "2025-06-03T11:04:36.694808+00:00"} {"global_step": 238763, "acc_step": 0, "speed/wps": 5517.327862560425, "speed/FLOPS": 243837651281130.1, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.2 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.2, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047053832560777664, "optim/lr": 8.442395724883589e-07, "optim/total_tokens": 2002889211904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2538132667541504, "created_at": "2025-06-03T11:04:39.671963+00:00"} {"global_step": 238764, "acc_step": 0, "speed/wps": 5519.726293283783, "speed/FLOPS": 243943649642821.2, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04694930836558342, "optim/lr": 8.406923473940343e-07, "optim/total_tokens": 2002897600512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2555124759674072, "created_at": "2025-06-03T11:04:42.648438+00:00"} {"global_step": 238765, "acc_step": 0, "speed/wps": 5513.106096893007, "speed/FLOPS": 243651070847585.78, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 197.04, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047070734202861786, "optim/lr": 8.371451222994874e-07, "optim/total_tokens": 2002905989120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2566276788711548, "created_at": "2025-06-03T11:04:45.626132+00:00"} {"global_step": 238766, "acc_step": 0, "speed/wps": 5519.270249941823, "speed/FLOPS": 243923494861347.97, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.82, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04838716611266136, "optim/lr": 8.335978972049407e-07, "optim/total_tokens": 2002914377728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2581002712249756, "created_at": "2025-06-03T11:04:48.603014+00:00"} {"global_step": 238767, "acc_step": 0, "speed/wps": 5526.540645691041, "speed/FLOPS": 244244809140204.53, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04738220199942589, "optim/lr": 8.30050672110394e-07, "optim/total_tokens": 2002922766336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2646197080612183, "created_at": "2025-06-03T11:04:51.572947+00:00"} {"global_step": 238768, "acc_step": 0, "speed/wps": 5539.96442501096, "speed/FLOPS": 244838071477013.75, "speed/curr_iter_time": 2.9565, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9565, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.09, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047540027648210526, "optim/lr": 8.265034470160692e-07, "optim/total_tokens": 2002931154944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2484374046325684, "created_at": "2025-06-03T11:04:54.536044+00:00"} {"global_step": 238769, "acc_step": 0, "speed/wps": 5502.6225235180045, "speed/FLOPS": 243187750564203.6, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 197.42, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04789149388670921, "optim/lr": 8.229562219215225e-07, "optim/total_tokens": 2002939543552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2701635360717773, "created_at": "2025-06-03T11:04:57.518034+00:00"} {"global_step": 238770, "acc_step": 0, "speed/wps": 5528.57212974534, "speed/FLOPS": 244334590337326.53, "speed/curr_iter_time": 2.9611, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9611, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.39, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04773946478962898, "optim/lr": 8.194089968269758e-07, "optim/total_tokens": 2002947932160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2587637901306152, "created_at": "2025-06-03T11:05:00.486130+00:00"} {"global_step": 238771, "acc_step": 0, "speed/wps": 5520.076642069806, "speed/FLOPS": 243959133265915.78, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.8, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047625359147787094, "optim/lr": 8.15861771732429e-07, "optim/total_tokens": 2002956320768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2531063556671143, "created_at": "2025-06-03T11:05:03.464454+00:00"} {"global_step": 238772, "acc_step": 0, "speed/wps": 5520.483157541547, "speed/FLOPS": 243977099169031.9, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.79, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04781505838036537, "optim/lr": 8.123145466381043e-07, "optim/total_tokens": 2002964709376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2616480588912964, "created_at": "2025-06-03T11:05:06.436898+00:00"} {"global_step": 238773, "acc_step": 0, "speed/wps": 5528.0836015283385, "speed/FLOPS": 244312999890649.16, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.52, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04720241576433182, "optim/lr": 8.087673215435576e-07, "optim/total_tokens": 2002973097984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2560415267944336, "created_at": "2025-06-03T11:05:09.410162+00:00"} {"global_step": 238774, "acc_step": 0, "speed/wps": 5534.79617751254, "speed/FLOPS": 244609661391072.34, "speed/curr_iter_time": 2.9578, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9578, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04797949641942978, "optim/lr": 8.052200964490109e-07, "optim/total_tokens": 2002981486592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2552247047424316, "created_at": "2025-06-03T11:05:12.378506+00:00"} {"global_step": 238775, "acc_step": 0, "speed/wps": 5517.191926255666, "speed/FLOPS": 243831643592244.78, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.19 hours", "speed/est_time_elapsed_hrs": 196.9, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.19, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047495950013399124, "optim/lr": 8.016728713544641e-07, "optim/total_tokens": 2002989875200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.269730806350708, "created_at": "2025-06-03T11:05:15.353115+00:00"} {"global_step": 238776, "acc_step": 0, "speed/wps": 5527.712102924866, "speed/FLOPS": 244296581553877.88, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04784153774380684, "optim/lr": 7.981256462601394e-07, "optim/total_tokens": 2002998263808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.256404161453247, "created_at": "2025-06-03T11:05:18.321735+00:00"} {"global_step": 238777, "acc_step": 0, "speed/wps": 5528.0636230029795, "speed/FLOPS": 244312116942087.66, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.42, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04721962288022041, "optim/lr": 7.945784211655927e-07, "optim/total_tokens": 2003006652416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2474730014801025, "created_at": "2025-06-03T11:05:21.293127+00:00"} {"global_step": 238778, "acc_step": 0, "speed/wps": 5518.419659563147, "speed/FLOPS": 243885903120326.75, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04789884760975838, "optim/lr": 7.910311960710458e-07, "optim/total_tokens": 2003015041024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2543635368347168, "created_at": "2025-06-03T11:05:24.268504+00:00"} {"global_step": 238779, "acc_step": 0, "speed/wps": 5521.799913801447, "speed/FLOPS": 244035293055949.94, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.75, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047539182007312775, "optim/lr": 7.874839709764991e-07, "optim/total_tokens": 2003023429632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.247178554534912, "created_at": "2025-06-03T11:05:27.240397+00:00"} {"global_step": 238780, "acc_step": 0, "speed/wps": 5520.170729925759, "speed/FLOPS": 243963291467563.56, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.7, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.06605421006679535, "optim/lr": 7.839367458821745e-07, "optim/total_tokens": 2003031818240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2531057596206665, "created_at": "2025-06-03T11:05:30.216558+00:00"} {"global_step": 238781, "acc_step": 0, "speed/wps": 5516.898468218364, "speed/FLOPS": 243818674249050.44, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.92, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04731474816799164, "optim/lr": 7.803895207876277e-07, "optim/total_tokens": 2003040206848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.264093041419983, "created_at": "2025-06-03T11:05:33.192047+00:00"} {"global_step": 238782, "acc_step": 0, "speed/wps": 5509.96548648038, "speed/FLOPS": 243512271942449.0, "speed/curr_iter_time": 2.9727, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9727, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 197.17, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04892297834157944, "optim/lr": 7.768422956930809e-07, "optim/total_tokens": 2003048595456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2523183822631836, "created_at": "2025-06-03T11:05:36.172880+00:00"} {"global_step": 238783, "acc_step": 0, "speed/wps": 5517.874195546805, "speed/FLOPS": 243861796402742.34, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.88, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046791236847639084, "optim/lr": 7.732950705987562e-07, "optim/total_tokens": 2003056984064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2544808387756348, "created_at": "2025-06-03T11:05:39.147092+00:00"} {"global_step": 238784, "acc_step": 0, "speed/wps": 5533.1455152708495, "speed/FLOPS": 244536710568844.88, "speed/curr_iter_time": 2.9585, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9585, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0476783849298954, "optim/lr": 7.697478455042095e-07, "optim/total_tokens": 2003065372672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.267391324043274, "created_at": "2025-06-03T11:05:42.112973+00:00"} {"global_step": 238785, "acc_step": 0, "speed/wps": 5534.304860393533, "speed/FLOPS": 244587947689201.22, "speed/curr_iter_time": 2.9595, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9595, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.3, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04728994518518448, "optim/lr": 7.662006204096627e-07, "optim/total_tokens": 2003073761280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.26687490940094, "created_at": "2025-06-03T11:05:45.078072+00:00"} {"global_step": 238786, "acc_step": 0, "speed/wps": 5531.620140035781, "speed/FLOPS": 244469296791033.1, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.4, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04767068102955818, "optim/lr": 7.62653395315116e-07, "optim/total_tokens": 2003082149888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2563222646713257, "created_at": "2025-06-03T11:05:48.046892+00:00"} {"global_step": 238787, "acc_step": 0, "speed/wps": 5529.901147351525, "speed/FLOPS": 244393326112991.12, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.18 hours", "speed/est_time_elapsed_hrs": 196.36, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.18, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04735828563570976, "optim/lr": 7.591061702207913e-07, "optim/total_tokens": 2003090538496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.245865821838379, "created_at": "2025-06-03T11:05:51.015541+00:00"} {"global_step": 238788, "acc_step": 0, "speed/wps": 5527.714063434314, "speed/FLOPS": 244296668198360.7, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047688569873571396, "optim/lr": 7.555589451262446e-07, "optim/total_tokens": 2003098927104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2561177015304565, "created_at": "2025-06-03T11:05:53.988255+00:00"} {"global_step": 238789, "acc_step": 0, "speed/wps": 5521.064731482723, "speed/FLOPS": 244002801760466.6, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04799109697341919, "optim/lr": 7.520117200316978e-07, "optim/total_tokens": 2003107315712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2501850128173828, "created_at": "2025-06-03T11:05:56.960619+00:00"} {"global_step": 238790, "acc_step": 0, "speed/wps": 5520.78897147319, "speed/FLOPS": 243990614579512.9, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.7, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047460708767175674, "optim/lr": 7.484644949371511e-07, "optim/total_tokens": 2003115704320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2367130517959595, "created_at": "2025-06-03T11:05:59.933887+00:00"} {"global_step": 238791, "acc_step": 0, "speed/wps": 5530.481298852706, "speed/FLOPS": 244418965839858.75, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04688120260834694, "optim/lr": 7.449172698428264e-07, "optim/total_tokens": 2003124092928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2681697607040405, "created_at": "2025-06-03T11:06:02.906440+00:00"} {"global_step": 238792, "acc_step": 0, "speed/wps": 5518.269325851723, "speed/FLOPS": 243879259139759.47, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.88, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.048397842794656754, "optim/lr": 7.413700447482796e-07, "optim/total_tokens": 2003132481536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2529041767120361, "created_at": "2025-06-03T11:06:05.880506+00:00"} {"global_step": 238793, "acc_step": 0, "speed/wps": 5525.836695807109, "speed/FLOPS": 244213698158476.88, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.61, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047559164464473724, "optim/lr": 7.378228196537329e-07, "optim/total_tokens": 2003140870144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2580095529556274, "created_at": "2025-06-03T11:06:08.852359+00:00"} {"global_step": 238794, "acc_step": 0, "speed/wps": 5534.432851284278, "speed/FLOPS": 244593604231455.34, "speed/curr_iter_time": 2.958, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.958, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.21, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04781878739595413, "optim/lr": 7.342755945591862e-07, "optim/total_tokens": 2003149258752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2591447830200195, "created_at": "2025-06-03T11:06:11.817563+00:00"} {"global_step": 238795, "acc_step": 0, "speed/wps": 5540.264218149401, "speed/FLOPS": 244851320799252.44, "speed/curr_iter_time": 2.9564, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9564, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.1, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04877496510744095, "optim/lr": 7.307283694648615e-07, "optim/total_tokens": 2003157647360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.252793550491333, "created_at": "2025-06-03T11:06:14.779364+00:00"} {"global_step": 238796, "acc_step": 0, "speed/wps": 5529.63792245229, "speed/FLOPS": 244381692919752.1, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04785245284438133, "optim/lr": 7.271811443703146e-07, "optim/total_tokens": 2003166035968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2457374334335327, "created_at": "2025-06-03T11:06:17.747258+00:00"} {"global_step": 238797, "acc_step": 0, "speed/wps": 5527.994096654312, "speed/FLOPS": 244309044233344.66, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.44, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04783518239855766, "optim/lr": 7.236339192757679e-07, "optim/total_tokens": 2003174424576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2531105279922485, "created_at": "2025-06-03T11:06:20.716201+00:00"} {"global_step": 238798, "acc_step": 0, "speed/wps": 5516.824972129092, "speed/FLOPS": 243815426098091.72, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04903901740908623, "optim/lr": 7.200866941812212e-07, "optim/total_tokens": 2003182813184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2421904802322388, "created_at": "2025-06-03T11:06:23.694250+00:00"} {"global_step": 238799, "acc_step": 0, "speed/wps": 5509.650881620091, "speed/FLOPS": 243498368017917.9, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.17 hours", "speed/est_time_elapsed_hrs": 197.19, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.17, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04733944684267044, "optim/lr": 7.165394690868964e-07, "optim/total_tokens": 2003191201792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.260589599609375, "created_at": "2025-06-03T11:06:26.675668+00:00"} {"global_step": 238800, "acc_step": 0, "speed/wps": 5517.354842114156, "speed/FLOPS": 243838843639311.1, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.84, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046928372234106064, "optim/lr": 7.129922439923497e-07, "optim/total_tokens": 2003199590400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2553722858428955, "created_at": "2025-06-03T11:06:29.649721+00:00"} {"global_step": 238801, "acc_step": 0, "speed/wps": 5529.426450403783, "speed/FLOPS": 244372346937620.16, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04674874246120453, "optim/lr": 7.09445018897803e-07, "optim/total_tokens": 2003207979008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2647167444229126, "created_at": "2025-06-03T11:06:32.617321+00:00"} {"global_step": 238802, "acc_step": 0, "speed/wps": 5523.815797078186, "speed/FLOPS": 244124384778555.84, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04798639938235283, "optim/lr": 7.058977938032563e-07, "optim/total_tokens": 2003216367616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2429862022399902, "created_at": "2025-06-03T11:06:35.591261+00:00"} {"global_step": 238803, "acc_step": 0, "speed/wps": 5536.777221641729, "speed/FLOPS": 244697213401679.4, "speed/curr_iter_time": 2.9582, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9582, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.23, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04753878340125084, "optim/lr": 7.023505687089315e-07, "optim/total_tokens": 2003224756224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2490909099578857, "created_at": "2025-06-03T11:06:38.558828+00:00"} {"global_step": 238804, "acc_step": 0, "speed/wps": 5521.889422291234, "speed/FLOPS": 244039248873052.56, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04808987304568291, "optim/lr": 6.988033436143848e-07, "optim/total_tokens": 2003233144832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2648807764053345, "created_at": "2025-06-03T11:06:41.533575+00:00"} {"global_step": 238805, "acc_step": 0, "speed/wps": 5523.843175304237, "speed/FLOPS": 244125594756012.84, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.7, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04764733463525772, "optim/lr": 6.952561185198381e-07, "optim/total_tokens": 2003241533440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2394462823867798, "created_at": "2025-06-03T11:06:44.507966+00:00"} {"global_step": 238806, "acc_step": 0, "speed/wps": 5520.626378976406, "speed/FLOPS": 243983428823378.9, "speed/curr_iter_time": 2.9669, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9669, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047071706503629684, "optim/lr": 6.917088934252913e-07, "optim/total_tokens": 2003249922048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2511616945266724, "created_at": "2025-06-03T11:06:47.484952+00:00"} {"global_step": 238807, "acc_step": 0, "speed/wps": 5523.38616488667, "speed/FLOPS": 244105397234747.72, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0471283458173275, "optim/lr": 6.881616683309666e-07, "optim/total_tokens": 2003258310656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2418694496154785, "created_at": "2025-06-03T11:06:50.455805+00:00"} {"global_step": 238808, "acc_step": 0, "speed/wps": 5528.338082833792, "speed/FLOPS": 244324246661796.8, "speed/curr_iter_time": 2.9627, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9627, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047709427773952484, "optim/lr": 6.846144432364199e-07, "optim/total_tokens": 2003266699264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2551568746566772, "created_at": "2025-06-03T11:06:53.425702+00:00"} {"global_step": 238809, "acc_step": 0, "speed/wps": 5529.751927341242, "speed/FLOPS": 244386731352313.84, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.49, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04918653517961502, "optim/lr": 6.810672181418732e-07, "optim/total_tokens": 2003275087872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2540638446807861, "created_at": "2025-06-03T11:06:56.395706+00:00"} {"global_step": 238810, "acc_step": 0, "speed/wps": 5530.816598765451, "speed/FLOPS": 244433784379781.56, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.45, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04721645265817642, "optim/lr": 6.775199930475484e-07, "optim/total_tokens": 2003283476480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.247408390045166, "created_at": "2025-06-03T11:06:59.362636+00:00"} {"global_step": 238811, "acc_step": 0, "speed/wps": 5524.523501235616, "speed/FLOPS": 244155661679956.0, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.16 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.16, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04762575775384903, "optim/lr": 6.739727679530017e-07, "optim/total_tokens": 2003291865088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.2377148866653442, "created_at": "2025-06-03T11:07:02.335569+00:00"} {"global_step": 238812, "acc_step": 0, "speed/wps": 5525.740400056192, "speed/FLOPS": 244209442379172.66, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047002971172332764, "optim/lr": 6.70425542858455e-07, "optim/total_tokens": 2003300253696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.257171392440796, "created_at": "2025-06-03T11:07:05.304780+00:00"} {"global_step": 238813, "acc_step": 0, "speed/wps": 5515.656508314715, "speed/FLOPS": 243763785978236.25, "speed/curr_iter_time": 2.9696, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9696, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.99, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04757412150502205, "optim/lr": 6.668783177639081e-07, "optim/total_tokens": 2003308642304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2534592151641846, "created_at": "2025-06-03T11:07:08.279490+00:00"} {"global_step": 238814, "acc_step": 0, "speed/wps": 5527.561540822114, "speed/FLOPS": 244289927479582.94, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04703656956553459, "optim/lr": 6.633310926695835e-07, "optim/total_tokens": 2003317030912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 415, "loss/out": 1.250744342803955, "created_at": "2025-06-03T11:07:11.250863+00:00"} {"global_step": 238815, "acc_step": 0, "speed/wps": 5520.346410486411, "speed/FLOPS": 243971055649129.75, "speed/curr_iter_time": 2.9671, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9671, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.83, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04932175576686859, "optim/lr": 6.597838675750367e-07, "optim/total_tokens": 2003325419520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2465900182724, "created_at": "2025-06-03T11:07:14.223218+00:00"} {"global_step": 238816, "acc_step": 0, "speed/wps": 5526.859402318789, "speed/FLOPS": 244258896551606.62, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04755084216594696, "optim/lr": 6.5623664248049e-07, "optim/total_tokens": 2003333808128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.227704405784607, "created_at": "2025-06-03T11:07:17.196397+00:00"} {"global_step": 238817, "acc_step": 0, "speed/wps": 5528.151225330997, "speed/FLOPS": 244315988516596.62, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047287702560424805, "optim/lr": 6.526894173859432e-07, "optim/total_tokens": 2003342196736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2448673248291016, "created_at": "2025-06-03T11:07:20.166795+00:00"} {"global_step": 238818, "acc_step": 0, "speed/wps": 5524.7525181365945, "speed/FLOPS": 244165783054764.5, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04699251428246498, "optim/lr": 6.491421922916185e-07, "optim/total_tokens": 2003350585344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2541332244873047, "created_at": "2025-06-03T11:07:23.136666+00:00"} {"global_step": 238819, "acc_step": 0, "speed/wps": 5524.295338597037, "speed/FLOPS": 244145578059173.06, "speed/curr_iter_time": 2.9649, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9649, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04721621423959732, "optim/lr": 6.455949671970718e-07, "optim/total_tokens": 2003358973952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2514145374298096, "created_at": "2025-06-03T11:07:26.107180+00:00"} {"global_step": 238820, "acc_step": 0, "speed/wps": 5536.989747779949, "speed/FLOPS": 244706605969181.34, "speed/curr_iter_time": 2.9581, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9581, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.24, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04858613759279251, "optim/lr": 6.42047742102525e-07, "optim/total_tokens": 2003367362560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 407, "loss/out": 1.2535804510116577, "created_at": "2025-06-03T11:07:29.070160+00:00"} {"global_step": 238821, "acc_step": 0, "speed/wps": 5520.5691581137025, "speed/FLOPS": 243980899954130.34, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047176264226436615, "optim/lr": 6.385005170079783e-07, "optim/total_tokens": 2003375751168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2526923418045044, "created_at": "2025-06-03T11:07:32.044399+00:00"} {"global_step": 238822, "acc_step": 0, "speed/wps": 5524.845072016808, "speed/FLOPS": 244169873462536.25, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04748169332742691, "optim/lr": 6.349532919136536e-07, "optim/total_tokens": 2003384139776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.254320502281189, "created_at": "2025-06-03T11:07:35.017321+00:00"} {"global_step": 238823, "acc_step": 0, "speed/wps": 5513.639275619925, "speed/FLOPS": 243674634618259.44, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 197.07, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04869180545210838, "optim/lr": 6.314060668191069e-07, "optim/total_tokens": 2003392528384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2609028816223145, "created_at": "2025-06-03T11:07:37.993413+00:00"} {"global_step": 238824, "acc_step": 0, "speed/wps": 5514.785567262371, "speed/FLOPS": 243725294841603.03, "speed/curr_iter_time": 2.9686, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9686, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.15 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.15, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04713628813624382, "optim/lr": 6.278588417245601e-07, "optim/total_tokens": 2003400916992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2582343816757202, "created_at": "2025-06-03T11:07:40.973322+00:00"} {"global_step": 238825, "acc_step": 0, "speed/wps": 5536.632247922858, "speed/FLOPS": 244690806305348.1, "speed/curr_iter_time": 2.9583, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9583, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.25, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04676501825451851, "optim/lr": 6.243116166300134e-07, "optim/total_tokens": 2003409305600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.269212245941162, "created_at": "2025-06-03T11:07:43.937119+00:00"} {"global_step": 238826, "acc_step": 0, "speed/wps": 5530.70746589948, "speed/FLOPS": 244428961265698.28, "speed/curr_iter_time": 2.9615, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9615, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04853293299674988, "optim/lr": 6.207643915356887e-07, "optim/total_tokens": 2003417694208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2395137548446655, "created_at": "2025-06-03T11:07:46.903858+00:00"} {"global_step": 238827, "acc_step": 0, "speed/wps": 5526.128443546545, "speed/FLOPS": 244226591915259.62, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.52, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0475577749311924, "optim/lr": 6.172171664411419e-07, "optim/total_tokens": 2003426082816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2538557052612305, "created_at": "2025-06-03T11:07:49.873958+00:00"} {"global_step": 238828, "acc_step": 0, "speed/wps": 5527.718382639107, "speed/FLOPS": 244296859085104.88, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04739346355199814, "optim/lr": 6.136699413465951e-07, "optim/total_tokens": 2003434471424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2544053792953491, "created_at": "2025-06-03T11:07:52.845512+00:00"} {"global_step": 238829, "acc_step": 0, "speed/wps": 5522.072106626549, "speed/FLOPS": 244047322585610.28, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04719047248363495, "optim/lr": 6.101227162520484e-07, "optim/total_tokens": 2003442860032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2531559467315674, "created_at": "2025-06-03T11:07:55.819500+00:00"} {"global_step": 238830, "acc_step": 0, "speed/wps": 5525.231620157958, "speed/FLOPS": 244186956911842.3, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04709477722644806, "optim/lr": 6.065754911577238e-07, "optim/total_tokens": 2003451248640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2480003833770752, "created_at": "2025-06-03T11:07:58.792673+00:00"} {"global_step": 238831, "acc_step": 0, "speed/wps": 5516.148464197453, "speed/FLOPS": 243785527910194.78, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.9, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04782630130648613, "optim/lr": 6.030282660631769e-07, "optim/total_tokens": 2003459637248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2497860193252563, "created_at": "2025-06-03T11:08:01.767418+00:00"} {"global_step": 238832, "acc_step": 0, "speed/wps": 5523.86429063208, "speed/FLOPS": 244126527945425.47, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.046820539981126785, "optim/lr": 5.994810409686302e-07, "optim/total_tokens": 2003468025856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2492022514343262, "created_at": "2025-06-03T11:08:04.737680+00:00"} {"global_step": 238833, "acc_step": 0, "speed/wps": 5532.647681263782, "speed/FLOPS": 244514708853877.94, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04749530926346779, "optim/lr": 5.959338158740835e-07, "optim/total_tokens": 2003476414464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2467619180679321, "created_at": "2025-06-03T11:08:07.703072+00:00"} {"global_step": 238834, "acc_step": 0, "speed/wps": 5515.512655371807, "speed/FLOPS": 243757428414465.8, "speed/curr_iter_time": 2.9683, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9683, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.93, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047560740262269974, "optim/lr": 5.923865907797587e-07, "optim/total_tokens": 2003484803072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2591567039489746, "created_at": "2025-06-03T11:08:10.678924+00:00"} {"global_step": 238835, "acc_step": 0, "speed/wps": 5524.796387735757, "speed/FLOPS": 244167721866502.5, "speed/curr_iter_time": 2.9646, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9646, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.68, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0474906824529171, "optim/lr": 5.88839365685212e-07, "optim/total_tokens": 2003493191680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.243440866470337, "created_at": "2025-06-03T11:08:13.652343+00:00"} {"global_step": 238836, "acc_step": 0, "speed/wps": 5519.796395074018, "speed/FLOPS": 243946747783136.06, "speed/curr_iter_time": 2.9674, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9674, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.14 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.14, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04833905026316643, "optim/lr": 5.852921405906653e-07, "optim/total_tokens": 2003501580288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.22843337059021, "created_at": "2025-06-03T11:08:16.628525+00:00"} {"global_step": 238837, "acc_step": 0, "speed/wps": 5519.030808699128, "speed/FLOPS": 243912912783992.25, "speed/curr_iter_time": 2.9678, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9678, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.89, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04743945598602295, "optim/lr": 5.817449154963406e-07, "optim/total_tokens": 2003509968896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2588335275650024, "created_at": "2025-06-03T11:08:19.601390+00:00"} {"global_step": 238838, "acc_step": 0, "speed/wps": 5529.830663514326, "speed/FLOPS": 244390211088155.94, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.41, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0472453236579895, "optim/lr": 5.781976904017938e-07, "optim/total_tokens": 2003518357504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2423584461212158, "created_at": "2025-06-03T11:08:22.568970+00:00"} {"global_step": 238839, "acc_step": 0, "speed/wps": 5524.408478811625, "speed/FLOPS": 244150578277553.75, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.7, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04756776988506317, "optim/lr": 5.746504653072471e-07, "optim/total_tokens": 2003526746112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.259002447128296, "created_at": "2025-06-03T11:08:25.539092+00:00"} {"global_step": 238840, "acc_step": 0, "speed/wps": 5510.476289897596, "speed/FLOPS": 243534846838961.06, "speed/curr_iter_time": 2.9722, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9722, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 197.19, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047737233340740204, "optim/lr": 5.711032402127004e-07, "optim/total_tokens": 2003535134720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2598607540130615, "created_at": "2025-06-03T11:08:28.517607+00:00"} {"global_step": 238841, "acc_step": 0, "speed/wps": 5515.832130372969, "speed/FLOPS": 243771547574295.88, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.92, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047357384115457535, "optim/lr": 5.675560151183756e-07, "optim/total_tokens": 2003543523328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2423824071884155, "created_at": "2025-06-03T11:08:31.492386+00:00"} {"global_step": 238842, "acc_step": 0, "speed/wps": 5527.985737055843, "speed/FLOPS": 244308674781880.62, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047045253217220306, "optim/lr": 5.640087900238289e-07, "optim/total_tokens": 2003551911936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2667874097824097, "created_at": "2025-06-03T11:08:34.460546+00:00"} {"global_step": 238843, "acc_step": 0, "speed/wps": 5525.832463724043, "speed/FLOPS": 244213511122067.1, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0478094182908535, "optim/lr": 5.604615649292822e-07, "optim/total_tokens": 2003560300544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.248497486114502, "created_at": "2025-06-03T11:08:37.430504+00:00"} {"global_step": 238844, "acc_step": 0, "speed/wps": 5524.54461135562, "speed/FLOPS": 244156594639208.78, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.61, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047382455319166183, "optim/lr": 5.569143398347353e-07, "optim/total_tokens": 2003568689152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2497104406356812, "created_at": "2025-06-03T11:08:40.400827+00:00"} {"global_step": 238845, "acc_step": 0, "speed/wps": 5521.01671287639, "speed/FLOPS": 244000679583848.16, "speed/curr_iter_time": 2.9667, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9667, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.83, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047081563621759415, "optim/lr": 5.533671147404107e-07, "optim/total_tokens": 2003577077760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2463226318359375, "created_at": "2025-06-03T11:08:43.375827+00:00"} {"global_step": 238846, "acc_step": 0, "speed/wps": 5521.37564133893, "speed/FLOPS": 244016542384730.03, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.82, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0467144250869751, "optim/lr": 5.49819889645864e-07, "optim/total_tokens": 2003585466368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2622963190078735, "created_at": "2025-06-03T11:08:46.353841+00:00"} {"global_step": 238847, "acc_step": 0, "speed/wps": 5517.694090114354, "speed/FLOPS": 243853836664491.2, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.95, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04704359918832779, "optim/lr": 5.462726645513172e-07, "optim/total_tokens": 2003593854976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2565041780471802, "created_at": "2025-06-03T11:08:49.328647+00:00"} {"global_step": 238848, "acc_step": 0, "speed/wps": 5516.728382545375, "speed/FLOPS": 243811157332881.75, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.13 hours", "speed/est_time_elapsed_hrs": 196.89, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.13, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04729054495692253, "optim/lr": 5.427254394567704e-07, "optim/total_tokens": 2003602243584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 399, "loss/out": 1.2483925819396973, "created_at": "2025-06-03T11:08:52.303418+00:00"} {"global_step": 238849, "acc_step": 0, "speed/wps": 5507.403168481318, "speed/FLOPS": 243399030602022.9, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 197.32, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04712621495127678, "optim/lr": 5.391782143624457e-07, "optim/total_tokens": 2003610632192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2543011903762817, "created_at": "2025-06-03T11:08:55.283588+00:00"} {"global_step": 238850, "acc_step": 0, "speed/wps": 5514.09182918505, "speed/FLOPS": 243694635169458.84, "speed/curr_iter_time": 2.9704, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9704, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 197.08, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.047371380031108856, "optim/lr": 5.35630989267899e-07, "optim/total_tokens": 2003619020800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2509516477584839, "created_at": "2025-06-03T11:08:58.264157+00:00"} {"global_step": 238851, "acc_step": 0, "speed/wps": 5510.194442652233, "speed/FLOPS": 243522390633341.0, "speed/curr_iter_time": 2.9711, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9711, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 197.13, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.0471944734454155, "optim/lr": 5.320837641733522e-07, "optim/total_tokens": 2003627409408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2535338401794434, "created_at": "2025-06-03T11:09:01.242446+00:00"} {"global_step": 238852, "acc_step": 0, "speed/wps": 5522.634482238483, "speed/FLOPS": 244072176709158.44, "speed/curr_iter_time": 2.9656, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9656, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 196.76, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04725426435470581, "optim/lr": 5.285365390788055e-07, "optim/total_tokens": 2003635798016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 422, "loss/out": 1.2419520616531372, "created_at": "2025-06-03T11:09:04.213998+00:00"} {"global_step": 238853, "acc_step": 0, "speed/wps": 5522.471283913217, "speed/FLOPS": 244064964178506.47, "speed/curr_iter_time": 2.9659, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9659, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04739644378423691, "optim/lr": 5.249893139844808e-07, "optim/total_tokens": 2003644186624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.257608413696289, "created_at": "2025-06-03T11:09:07.185699+00:00"} {"global_step": 238854, "acc_step": 0, "speed/wps": 5519.252312090801, "speed/FLOPS": 243922702100147.03, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 196.82, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.01, "optim/grad_norm": 0.04762335866689682, "optim/lr": 5.214420888899341e-07, "optim/total_tokens": 2003652575232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 379, "loss/out": 1.2433910369873047, "created_at": "2025-06-03T11:09:10.162524+00:00"} {"global_step": 238855, "acc_step": 0, "speed/wps": 5516.979813336049, "speed/FLOPS": 243822269286890.1, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 196.98, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04735634848475456, "optim/lr": 5.178948637953873e-07, "optim/total_tokens": 2003660963840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.260229468345642, "created_at": "2025-06-03T11:09:13.141701+00:00"} {"global_step": 238856, "acc_step": 0, "speed/wps": 5513.718780565872, "speed/FLOPS": 243678148329927.1, "speed/curr_iter_time": 2.9706, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9706, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 197.1, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04711372032761574, "optim/lr": 5.143476387008406e-07, "optim/total_tokens": 2003669352448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2367630004882812, "created_at": "2025-06-03T11:09:16.118062+00:00"} {"global_step": 238857, "acc_step": 0, "speed/wps": 5506.901911023977, "speed/FLOPS": 243376877588076.7, "speed/curr_iter_time": 2.9743, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9743, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 197.34, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04667413979768753, "optim/lr": 5.108004136065159e-07, "optim/total_tokens": 2003677741056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2671138048171997, "created_at": "2025-06-03T11:09:19.099846+00:00"} {"global_step": 238858, "acc_step": 0, "speed/wps": 5519.203715069881, "speed/FLOPS": 243920554360564.47, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04805147647857666, "optim/lr": 5.072531885119691e-07, "optim/total_tokens": 2003686129664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2431771755218506, "created_at": "2025-06-03T11:09:22.073861+00:00"} {"global_step": 238859, "acc_step": 0, "speed/wps": 5527.640221143986, "speed/FLOPS": 244293404747087.3, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 196.6, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04770216345787048, "optim/lr": 5.037059634174224e-07, "optim/total_tokens": 2003694518272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 380, "loss/out": 1.262157917022705, "created_at": "2025-06-03T11:09:25.045576+00:00"} {"global_step": 238860, "acc_step": 0, "speed/wps": 5523.940481641223, "speed/FLOPS": 244129895198048.66, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.12 hours", "speed/est_time_elapsed_hrs": 196.73, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.12, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047367293387651443, "optim/lr": 5.001587383228756e-07, "optim/total_tokens": 2003702906880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.246981143951416, "created_at": "2025-06-03T11:09:28.017986+00:00"} {"global_step": 238861, "acc_step": 0, "speed/wps": 5517.542463879401, "speed/FLOPS": 243847135560999.7, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04966909810900688, "optim/lr": 4.96611513228551e-07, "optim/total_tokens": 2003711295488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2349283695220947, "created_at": "2025-06-03T11:09:30.991888+00:00"} {"global_step": 238862, "acc_step": 0, "speed/wps": 5530.098362675368, "speed/FLOPS": 244402042020865.44, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.52, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047257207334041595, "optim/lr": 4.930642881340041e-07, "optim/total_tokens": 2003719684096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.248173713684082, "created_at": "2025-06-03T11:09:33.963804+00:00"} {"global_step": 238863, "acc_step": 0, "speed/wps": 5518.128375125365, "speed/FLOPS": 243873029839105.7, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04733022674918175, "optim/lr": 4.895170630394574e-07, "optim/total_tokens": 2003728072704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2673742771148682, "created_at": "2025-06-03T11:09:36.942659+00:00"} {"global_step": 238864, "acc_step": 0, "speed/wps": 5515.215122500246, "speed/FLOPS": 243744278984454.12, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.96, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04782368615269661, "optim/lr": 4.859698379449107e-07, "optim/total_tokens": 2003736461312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.2644697427749634, "created_at": "2025-06-03T11:09:39.917948+00:00"} {"global_step": 238865, "acc_step": 0, "speed/wps": 5516.912200023593, "speed/FLOPS": 243819281124555.8, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.99, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04671582207083702, "optim/lr": 4.824226128505859e-07, "optim/total_tokens": 2003744849920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2515157461166382, "created_at": "2025-06-03T11:09:42.897493+00:00"} {"global_step": 238866, "acc_step": 0, "speed/wps": 5507.060767993974, "speed/FLOPS": 243383898253046.88, "speed/curr_iter_time": 2.9742, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9742, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 197.34, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04703928157687187, "optim/lr": 4.788753877560392e-07, "optim/total_tokens": 2003753238528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2641150951385498, "created_at": "2025-06-03T11:09:45.880704+00:00"} {"global_step": 238867, "acc_step": 0, "speed/wps": 5509.98657738649, "speed/FLOPS": 243513204052546.03, "speed/curr_iter_time": 2.9726, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9726, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 197.24, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.0470825619995594, "optim/lr": 4.7532816266149246e-07, "optim/total_tokens": 2003761627136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2492951154708862, "created_at": "2025-06-03T11:09:48.858772+00:00"} {"global_step": 238868, "acc_step": 0, "speed/wps": 5521.908978801067, "speed/FLOPS": 244040113170687.88, "speed/curr_iter_time": 2.9648, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9648, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04796326532959938, "optim/lr": 4.7178093756716777e-07, "optim/total_tokens": 2003770015744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2656230926513672, "created_at": "2025-06-03T11:09:51.833989+00:00"} {"global_step": 238869, "acc_step": 0, "speed/wps": 5530.887938054375, "speed/FLOPS": 244436937211204.4, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04715484008193016, "optim/lr": 4.68233712472621e-07, "optim/total_tokens": 2003778404352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 418, "loss/out": 1.2466330528259277, "created_at": "2025-06-03T11:09:54.805115+00:00"} {"global_step": 238870, "acc_step": 0, "speed/wps": 5518.272996778664, "speed/FLOPS": 243879421375940.75, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.94, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04836822301149368, "optim/lr": 4.646864873780743e-07, "optim/total_tokens": 2003786792960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2578811645507812, "created_at": "2025-06-03T11:09:57.779015+00:00"} {"global_step": 238871, "acc_step": 0, "speed/wps": 5519.642737885121, "speed/FLOPS": 243939956921875.62, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.82, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04725060984492302, "optim/lr": 4.6113926228352753e-07, "optim/total_tokens": 2003795181568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2598387002944946, "created_at": "2025-06-03T11:10:00.751807+00:00"} {"global_step": 238872, "acc_step": 0, "speed/wps": 5528.735718828013, "speed/FLOPS": 244341820137455.84, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.11 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.11, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04738585278391838, "optim/lr": 4.5759203718920285e-07, "optim/total_tokens": 2003803570176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2718138694763184, "created_at": "2025-06-03T11:10:03.720464+00:00"} {"global_step": 238873, "acc_step": 0, "speed/wps": 5516.4364450159455, "speed/FLOPS": 243798255188352.7, "speed/curr_iter_time": 2.9691, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9691, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 197.01, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047840747982263565, "optim/lr": 4.540448120946561e-07, "optim/total_tokens": 2003811958784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2587785720825195, "created_at": "2025-06-03T11:10:06.697054+00:00"} {"global_step": 238874, "acc_step": 0, "speed/wps": 5513.408511666293, "speed/FLOPS": 243664436032665.88, "speed/curr_iter_time": 2.9707, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9707, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 197.12, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04775703325867653, "optim/lr": 4.504975870001093e-07, "optim/total_tokens": 2003820347392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2623182535171509, "created_at": "2025-06-03T11:10:09.676064+00:00"} {"global_step": 238875, "acc_step": 0, "speed/wps": 5520.934242447966, "speed/FLOPS": 243997034813033.78, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 196.77, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.061740435659885406, "optim/lr": 4.469503619055626e-07, "optim/total_tokens": 2003828736000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2517362833023071, "created_at": "2025-06-03T11:10:12.654356+00:00"} {"global_step": 238876, "acc_step": 0, "speed/wps": 5524.664415817083, "speed/FLOPS": 244161889383190.62, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04797923564910889, "optim/lr": 4.4340313681123787e-07, "optim/total_tokens": 2003837124608, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2531988620758057, "created_at": "2025-06-03T11:10:15.629064+00:00"} {"global_step": 238877, "acc_step": 0, "speed/wps": 5523.989564528213, "speed/FLOPS": 244132064410424.6, "speed/curr_iter_time": 2.9651, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9651, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 196.75, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04741063341498375, "optim/lr": 4.3985591171669116e-07, "optim/total_tokens": 2003845513216, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2562992572784424, "created_at": "2025-06-03T11:10:18.600320+00:00"} {"global_step": 238878, "acc_step": 0, "speed/wps": 5528.514108166382, "speed/FLOPS": 244332026080517.97, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04774274677038193, "optim/lr": 4.363086866221444e-07, "optim/total_tokens": 2003853901824, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2558947801589966, "created_at": "2025-06-03T11:10:21.569248+00:00"} {"global_step": 238879, "acc_step": 0, "speed/wps": 5526.018608173147, "speed/FLOPS": 244221737753943.84, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 196.68, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.046849604696035385, "optim/lr": 4.3276146152759763e-07, "optim/total_tokens": 2003862290432, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2333366870880127, "created_at": "2025-06-03T11:10:24.541873+00:00"} {"global_step": 238880, "acc_step": 0, "speed/wps": 5528.678169453725, "speed/FLOPS": 244339276749676.72, "speed/curr_iter_time": 2.9626, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9626, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04667006433010101, "optim/lr": 4.2921423643327295e-07, "optim/total_tokens": 2003870679040, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2609118223190308, "created_at": "2025-06-03T11:10:27.510006+00:00"} {"global_step": 238881, "acc_step": 0, "speed/wps": 5519.266991103064, "speed/FLOPS": 243923350837355.1, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 196.83, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047475866973400116, "optim/lr": 4.256670113387262e-07, "optim/total_tokens": 2003879067648, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 419, "loss/out": 1.245258092880249, "created_at": "2025-06-03T11:10:30.483316+00:00"} {"global_step": 238882, "acc_step": 0, "speed/wps": 5502.705878959472, "speed/FLOPS": 243191434448064.62, "speed/curr_iter_time": 2.9766, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9766, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 197.52, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04692739620804787, "optim/lr": 4.2211978624417947e-07, "optim/total_tokens": 2003887456256, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.249415636062622, "created_at": "2025-06-03T11:10:33.465792+00:00"} {"global_step": 238883, "acc_step": 0, "speed/wps": 5514.231044548573, "speed/FLOPS": 243700787775957.72, "speed/curr_iter_time": 2.9703, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9703, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 197.1, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04752192273736, "optim/lr": 4.185725611496327e-07, "optim/total_tokens": 2003895844864, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2661585807800293, "created_at": "2025-06-03T11:10:36.441966+00:00"} {"global_step": 238884, "acc_step": 0, "speed/wps": 5503.934919618796, "speed/FLOPS": 243245751754406.38, "speed/curr_iter_time": 2.9759, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9759, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.1 hours", "speed/est_time_elapsed_hrs": 197.47, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.1, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047550056129693985, "optim/lr": 4.15025336055308e-07, "optim/total_tokens": 2003904233472, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2538821697235107, "created_at": "2025-06-03T11:10:39.422780+00:00"} {"global_step": 238885, "acc_step": 0, "speed/wps": 5528.472229593583, "speed/FLOPS": 244330175261954.2, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.5, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047325026243925095, "optim/lr": 4.1147811096076126e-07, "optim/total_tokens": 2003912622080, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 391, "loss/out": 1.2510688304901123, "created_at": "2025-06-03T11:10:42.390878+00:00"} {"global_step": 238886, "acc_step": 0, "speed/wps": 5528.79386277869, "speed/FLOPS": 244344389802468.03, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04826992377638817, "optim/lr": 4.079308858662145e-07, "optim/total_tokens": 2003921010688, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 365, "loss/out": 1.2493914365768433, "created_at": "2025-06-03T11:10:45.359016+00:00"} {"global_step": 238887, "acc_step": 0, "speed/wps": 5525.767317019063, "speed/FLOPS": 244210631971158.03, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047421425580978394, "optim/lr": 4.043836607716678e-07, "optim/total_tokens": 2003929399296, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2560601234436035, "created_at": "2025-06-03T11:10:48.331100+00:00"} {"global_step": 238888, "acc_step": 0, "speed/wps": 5520.559061278255, "speed/FLOPS": 243980453725683.84, "speed/curr_iter_time": 2.9655, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9655, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.78, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04748094454407692, "optim/lr": 4.0083643567734304e-07, "optim/total_tokens": 2003937787904, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.265860915184021, "created_at": "2025-06-03T11:10:51.303946+00:00"} {"global_step": 238889, "acc_step": 0, "speed/wps": 5522.496070502563, "speed/FLOPS": 244066059618886.28, "speed/curr_iter_time": 2.9658, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9658, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.8, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047449275851249695, "optim/lr": 3.9728921058279633e-07, "optim/total_tokens": 2003946176512, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 404, "loss/out": 1.2580136060714722, "created_at": "2025-06-03T11:10:54.274965+00:00"} {"global_step": 238890, "acc_step": 0, "speed/wps": 5509.745696360349, "speed/FLOPS": 243502558344131.44, "speed/curr_iter_time": 2.9728, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9728, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 197.27, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04692516103386879, "optim/lr": 3.9374198548824957e-07, "optim/total_tokens": 2003954565120, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2467697858810425, "created_at": "2025-06-03T11:10:57.253475+00:00"} {"global_step": 238891, "acc_step": 0, "speed/wps": 5519.961396849404, "speed/FLOPS": 243954040017052.5, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.82, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04706788808107376, "optim/lr": 3.901947603937028e-07, "optim/total_tokens": 2003962953728, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 361, "loss/out": 1.252530574798584, "created_at": "2025-06-03T11:11:00.226635+00:00"} {"global_step": 238892, "acc_step": 0, "speed/wps": 5519.380745380984, "speed/FLOPS": 243928378194191.97, "speed/curr_iter_time": 2.9676, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9676, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.93, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04712629318237305, "optim/lr": 3.866475352993781e-07, "optim/total_tokens": 2003971342336, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2487918138504028, "created_at": "2025-06-03T11:11:03.203313+00:00"} {"global_step": 238893, "acc_step": 0, "speed/wps": 5527.786423054919, "speed/FLOPS": 244299866123221.34, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04759787768125534, "optim/lr": 3.8310031020483136e-07, "optim/total_tokens": 2003979730944, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.261265754699707, "created_at": "2025-06-03T11:11:06.171900+00:00"} {"global_step": 238894, "acc_step": 0, "speed/wps": 5532.035778682199, "speed/FLOPS": 244487665891773.28, "speed/curr_iter_time": 2.9608, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9608, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.48, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047448523342609406, "optim/lr": 3.7955308511028464e-07, "optim/total_tokens": 2003988119552, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2517070770263672, "created_at": "2025-06-03T11:11:09.138049+00:00"} {"global_step": 238895, "acc_step": 0, "speed/wps": 5520.332352806488, "speed/FLOPS": 243970434371630.9, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.8, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04787276312708855, "optim/lr": 3.760058600159599e-07, "optim/total_tokens": 2003996508160, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2588088512420654, "created_at": "2025-06-03T11:11:12.111807+00:00"} {"global_step": 238896, "acc_step": 0, "speed/wps": 5527.642501615399, "speed/FLOPS": 244293505532251.25, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.09 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.09, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04751710966229439, "optim/lr": 3.724586349214132e-07, "optim/total_tokens": 2004004896768, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2444556951522827, "created_at": "2025-06-03T11:11:15.083561+00:00"} {"global_step": 238897, "acc_step": 0, "speed/wps": 5531.098423286503, "speed/FLOPS": 244446239581103.38, "speed/curr_iter_time": 2.9612, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9612, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 196.51, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04717058688402176, "optim/lr": 3.6891140982686643e-07, "optim/total_tokens": 2004013285376, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2421075105667114, "created_at": "2025-06-03T11:11:18.053061+00:00"} {"global_step": 238898, "acc_step": 0, "speed/wps": 5521.93987744165, "speed/FLOPS": 244041478732448.1, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04721496254205704, "optim/lr": 3.653641847323197e-07, "optim/total_tokens": 2004021673984, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.252242088317871, "created_at": "2025-06-03T11:11:21.027911+00:00"} {"global_step": 238899, "acc_step": 0, "speed/wps": 5511.134390908531, "speed/FLOPS": 243563931535178.03, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 197.22, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047715794295072556, "optim/lr": 3.61816959637995e-07, "optim/total_tokens": 2004030062592, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2501204013824463, "created_at": "2025-06-03T11:11:24.009686+00:00"} {"global_step": 238900, "acc_step": 0, "speed/wps": 5511.725601950476, "speed/FLOPS": 243590060037139.56, "speed/curr_iter_time": 2.9716, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9716, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 197.2, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.0472857803106308, "optim/lr": 3.582697345434482e-07, "optim/total_tokens": 2004038451200, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.258428931236267, "created_at": "2025-06-03T11:11:26.986840+00:00"} {"global_step": 238901, "acc_step": 0, "speed/wps": 5526.304608122807, "speed/FLOPS": 244234377487838.34, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.046699464321136475, "optim/lr": 3.547225094489015e-07, "optim/total_tokens": 2004046839808, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2591254711151123, "created_at": "2025-06-03T11:11:29.958901+00:00"} {"global_step": 238902, "acc_step": 0, "speed/wps": 5529.039902898791, "speed/FLOPS": 244355263516429.03, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 196.58, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.048365507274866104, "optim/lr": 3.5117528435435474e-07, "optim/total_tokens": 2004055228416, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2482596635818481, "created_at": "2025-06-03T11:11:32.926120+00:00"} {"global_step": 238903, "acc_step": 0, "speed/wps": 5532.390069784891, "speed/FLOPS": 244503323745086.03, "speed/curr_iter_time": 2.9605, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9605, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 196.46, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.0476989708840847, "optim/lr": 3.4762805926003006e-07, "optim/total_tokens": 2004063617024, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2502139806747437, "created_at": "2025-06-03T11:11:35.891476+00:00"} {"global_step": 238904, "acc_step": 0, "speed/wps": 5523.280004236511, "speed/FLOPS": 244100705477390.16, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 196.79, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047695282846689224, "optim/lr": 3.440808341654833e-07, "optim/total_tokens": 2004072005632, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 387, "loss/out": 1.2634938955307007, "created_at": "2025-06-03T11:11:38.864731+00:00"} {"global_step": 238905, "acc_step": 0, "speed/wps": 5527.333688548951, "speed/FLOPS": 244279857575362.78, "speed/curr_iter_time": 2.9619, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9619, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 196.56, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04712250456213951, "optim/lr": 3.405336090709366e-07, "optim/total_tokens": 2004080394240, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2445690631866455, "created_at": "2025-06-03T11:11:41.833166+00:00"} {"global_step": 238906, "acc_step": 0, "speed/wps": 5507.565716240351, "speed/FLOPS": 243406214380977.3, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 197.34, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047115325927734375, "optim/lr": 3.369863839763898e-07, "optim/total_tokens": 2004088782848, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2510000467300415, "created_at": "2025-06-03T11:11:44.818708+00:00"} {"global_step": 238907, "acc_step": 0, "speed/wps": 5507.890249920746, "speed/FLOPS": 243420557108536.8, "speed/curr_iter_time": 2.9736, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9736, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 197.34, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04760192707180977, "optim/lr": 3.334391588820651e-07, "optim/total_tokens": 2004097171456, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.2488893270492554, "created_at": "2025-06-03T11:11:47.798194+00:00"} {"global_step": 238908, "acc_step": 0, "speed/wps": 5511.420060886288, "speed/FLOPS": 243576556686003.44, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.08 hours", "speed/est_time_elapsed_hrs": 197.11, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.08, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047227680683135986, "optim/lr": 3.2989193378751837e-07, "optim/total_tokens": 2004105560064, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2473945617675781, "created_at": "2025-06-03T11:11:50.779144+00:00"} {"global_step": 238909, "acc_step": 0, "speed/wps": 5524.425152114721, "speed/FLOPS": 244151315152208.88, "speed/curr_iter_time": 2.9647, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9647, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.75, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04841950535774231, "optim/lr": 3.263447086929716e-07, "optim/total_tokens": 2004113948672, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.242043137550354, "created_at": "2025-06-03T11:11:53.754348+00:00"} {"global_step": 238910, "acc_step": 0, "speed/wps": 5523.474647424389, "speed/FLOPS": 244109307710020.25, "speed/curr_iter_time": 2.9653, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9653, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.79, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047436825931072235, "optim/lr": 3.227974835984249e-07, "optim/total_tokens": 2004122337280, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2566609382629395, "created_at": "2025-06-03T11:11:56.725401+00:00"} {"global_step": 238911, "acc_step": 0, "speed/wps": 5525.1856066269675, "speed/FLOPS": 244184923349291.12, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.73, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04699132964015007, "optim/lr": 3.1925025850410016e-07, "optim/total_tokens": 2004130725888, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2615798711776733, "created_at": "2025-06-03T11:11:59.696664+00:00"} {"global_step": 238912, "acc_step": 0, "speed/wps": 5520.5339624888475, "speed/FLOPS": 243979344487659.28, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.8, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047547847032547, "optim/lr": 3.1570303340955345e-07, "optim/total_tokens": 2004139114496, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 386, "loss/out": 1.2303428649902344, "created_at": "2025-06-03T11:12:02.668710+00:00"} {"global_step": 238913, "acc_step": 0, "speed/wps": 5526.393034889853, "speed/FLOPS": 244238285498332.56, "speed/curr_iter_time": 2.9637, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9637, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.046762049198150635, "optim/lr": 3.121558083150067e-07, "optim/total_tokens": 2004147503104, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.247597098350525, "created_at": "2025-06-03T11:12:05.640194+00:00"} {"global_step": 238914, "acc_step": 0, "speed/wps": 5518.819580159673, "speed/FLOPS": 243903577563714.0, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.95, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04652703180909157, "optim/lr": 3.086085832204599e-07, "optim/total_tokens": 2004155891712, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2555782794952393, "created_at": "2025-06-03T11:12:08.613890+00:00"} {"global_step": 238915, "acc_step": 0, "speed/wps": 5515.393100085955, "speed/FLOPS": 243752144682770.56, "speed/curr_iter_time": 2.9682, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9682, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.99, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04727698490023613, "optim/lr": 3.0506135812613523e-07, "optim/total_tokens": 2004164280320, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2408190965652466, "created_at": "2025-06-03T11:12:11.590581+00:00"} {"global_step": 238916, "acc_step": 0, "speed/wps": 5512.818400621274, "speed/FLOPS": 243638356144938.2, "speed/curr_iter_time": 2.971, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.971, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 197.17, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04738176241517067, "optim/lr": 3.0151413303158847e-07, "optim/total_tokens": 2004172668928, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.242929458618164, "created_at": "2025-06-03T11:12:14.567104+00:00"} {"global_step": 238917, "acc_step": 0, "speed/wps": 5519.689378722691, "speed/FLOPS": 243942018208166.75, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.93, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04788820818066597, "optim/lr": 2.9796690793704176e-07, "optim/total_tokens": 2004181057536, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2435325384140015, "created_at": "2025-06-03T11:12:17.543234+00:00"} {"global_step": 238918, "acc_step": 0, "speed/wps": 5524.327560681614, "speed/FLOPS": 244147002110383.78, "speed/curr_iter_time": 2.9634, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9634, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04810550808906555, "optim/lr": 2.94419682842495e-07, "optim/total_tokens": 2004189446144, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2568023204803467, "created_at": "2025-06-03T11:12:20.514589+00:00"} {"global_step": 238919, "acc_step": 0, "speed/wps": 5530.864838418418, "speed/FLOPS": 244435916325529.75, "speed/curr_iter_time": 2.9613, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9613, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.53, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04705646634101868, "optim/lr": 2.908724577481703e-07, "optim/total_tokens": 2004197834752, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2617106437683105, "created_at": "2025-06-03T11:12:23.484296+00:00"} {"global_step": 238920, "acc_step": 0, "speed/wps": 5521.282565542291, "speed/FLOPS": 244012428910923.72, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.07 hours", "speed/est_time_elapsed_hrs": 196.88, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.07, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.0474180206656456, "optim/lr": 2.8732523265362354e-07, "optim/total_tokens": 2004206223360, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 394, "loss/out": 1.2334372997283936, "created_at": "2025-06-03T11:12:26.456049+00:00"} {"global_step": 238921, "acc_step": 0, "speed/wps": 5530.637988222671, "speed/FLOPS": 244425890708002.3, "speed/curr_iter_time": 2.9614, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9614, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.54, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047007013112306595, "optim/lr": 2.837780075590768e-07, "optim/total_tokens": 2004214611968, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 412, "loss/out": 1.2550930976867676, "created_at": "2025-06-03T11:12:29.422159+00:00"} {"global_step": 238922, "acc_step": 0, "speed/wps": 5526.066952505969, "speed/FLOPS": 244223874326005.84, "speed/curr_iter_time": 2.9624, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9624, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.61, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04755404219031334, "optim/lr": 2.802307824647521e-07, "optim/total_tokens": 2004223000576, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 405, "loss/out": 1.269448161125183, "created_at": "2025-06-03T11:12:32.392026+00:00"} {"global_step": 238923, "acc_step": 0, "speed/wps": 5525.446397704782, "speed/FLOPS": 244196448980080.78, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.73, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04677729681134224, "optim/lr": 2.7668355737020533e-07, "optim/total_tokens": 2004231389184, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 416, "loss/out": 1.245010495185852, "created_at": "2025-06-03T11:12:35.365350+00:00"} {"global_step": 238924, "acc_step": 0, "speed/wps": 5505.170825436409, "speed/FLOPS": 243300372465605.44, "speed/curr_iter_time": 2.9752, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9752, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 197.46, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04848777502775192, "optim/lr": 2.731363322756586e-07, "optim/total_tokens": 2004239777792, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 375, "loss/out": 1.2660863399505615, "created_at": "2025-06-03T11:12:38.350928+00:00"} {"global_step": 238925, "acc_step": 0, "speed/wps": 5508.757605341786, "speed/FLOPS": 243458889778619.28, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 197.24, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04780431464314461, "optim/lr": 2.6958910718111185e-07, "optim/total_tokens": 2004248166400, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 362, "loss/out": 1.245996356010437, "created_at": "2025-06-03T11:12:41.329692+00:00"} {"global_step": 238926, "acc_step": 0, "speed/wps": 5514.618351778066, "speed/FLOPS": 243717904773083.22, "speed/curr_iter_time": 2.9701, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9701, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 197.12, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.0473393015563488, "optim/lr": 2.6604188208678717e-07, "optim/total_tokens": 2004256555008, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2611826658248901, "created_at": "2025-06-03T11:12:44.304914+00:00"} {"global_step": 238927, "acc_step": 0, "speed/wps": 5532.698562457071, "speed/FLOPS": 244516957542187.75, "speed/curr_iter_time": 2.9603, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9603, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.47, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047724705189466476, "optim/lr": 2.624946569922404e-07, "optim/total_tokens": 2004264943616, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2664694786071777, "created_at": "2025-06-03T11:12:47.274371+00:00"} {"global_step": 238928, "acc_step": 0, "speed/wps": 5524.853912281773, "speed/FLOPS": 244170264156999.1, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04705781489610672, "optim/lr": 2.5894743189769364e-07, "optim/total_tokens": 2004273332224, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2449673414230347, "created_at": "2025-06-03T11:12:50.243902+00:00"} {"global_step": 238929, "acc_step": 0, "speed/wps": 5530.12707615993, "speed/FLOPS": 244403311009914.16, "speed/curr_iter_time": 2.9617, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9617, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04741663858294487, "optim/lr": 2.5540020680314693e-07, "optim/total_tokens": 2004281720832, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2375887632369995, "created_at": "2025-06-03T11:12:53.214640+00:00"} {"global_step": 238930, "acc_step": 0, "speed/wps": 5520.178454021341, "speed/FLOPS": 243963632833052.78, "speed/curr_iter_time": 2.967, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.967, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.92, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04725266247987747, "optim/lr": 2.518529817088222e-07, "optim/total_tokens": 2004290109440, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 378, "loss/out": 1.2477983236312866, "created_at": "2025-06-03T11:12:56.186626+00:00"} {"global_step": 238931, "acc_step": 0, "speed/wps": 5526.193952896828, "speed/FLOPS": 244229487093234.88, "speed/curr_iter_time": 2.9638, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9638, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.71, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04725079983472824, "optim/lr": 2.483057566142755e-07, "optim/total_tokens": 2004298498048, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.257591724395752, "created_at": "2025-06-03T11:12:59.160110+00:00"} {"global_step": 238932, "acc_step": 0, "speed/wps": 5527.015879576415, "speed/FLOPS": 244265812045470.5, "speed/curr_iter_time": 2.962, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.962, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 196.59, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04781403765082359, "optim/lr": 2.447585315197287e-07, "optim/total_tokens": 2004306886656, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2575887441635132, "created_at": "2025-06-03T11:13:02.131693+00:00"} {"global_step": 238933, "acc_step": 0, "speed/wps": 5513.8407803656955, "speed/FLOPS": 243683540096627.72, "speed/curr_iter_time": 2.9705, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9705, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.06 hours", "speed/est_time_elapsed_hrs": 197.15, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.06, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.046999868005514145, "optim/lr": 2.4121130642518195e-07, "optim/total_tokens": 2004315275264, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2490895986557007, "created_at": "2025-06-03T11:13:05.108168+00:00"} {"global_step": 238934, "acc_step": 0, "speed/wps": 5528.770806259971, "speed/FLOPS": 244343370822354.62, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04752136766910553, "optim/lr": 2.3766408133085727e-07, "optim/total_tokens": 2004323663872, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2421363592147827, "created_at": "2025-06-03T11:13:08.081050+00:00"} {"global_step": 238935, "acc_step": 0, "speed/wps": 5535.675846993363, "speed/FLOPS": 244648538279568.12, "speed/curr_iter_time": 2.9575, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9575, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.29, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04683256149291992, "optim/lr": 2.341168562363105e-07, "optim/total_tokens": 2004332052480, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2641953229904175, "created_at": "2025-06-03T11:13:11.045523+00:00"} {"global_step": 238936, "acc_step": 0, "speed/wps": 5523.075222340963, "speed/FLOPS": 244091655165775.72, "speed/curr_iter_time": 2.9654, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9654, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.82, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04711204394698143, "optim/lr": 2.3056963114176377e-07, "optim/total_tokens": 2004340441088, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 389, "loss/out": 1.2311521768569946, "created_at": "2025-06-03T11:13:14.015950+00:00"} {"global_step": 238937, "acc_step": 0, "speed/wps": 5535.563140967486, "speed/FLOPS": 244643557250106.12, "speed/curr_iter_time": 2.9588, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9588, "speed/est_time_elapsed": "8.18 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.38, "speed/est_time_elapsed_days": 8.18, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047348495572805405, "optim/lr": 2.2702240604721703e-07, "optim/total_tokens": 2004348829696, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2467434406280518, "created_at": "2025-06-03T11:13:16.979855+00:00"} {"global_step": 238938, "acc_step": 0, "speed/wps": 5521.50893138581, "speed/FLOPS": 244022433122561.8, "speed/curr_iter_time": 2.9663, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9663, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.88, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.046962156891822815, "optim/lr": 2.2347518095289232e-07, "optim/total_tokens": 2004357218304, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 414, "loss/out": 1.2496662139892578, "created_at": "2025-06-03T11:13:19.957828+00:00"} {"global_step": 238939, "acc_step": 0, "speed/wps": 5524.888551818315, "speed/FLOPS": 244171795047213.03, "speed/curr_iter_time": 2.9632, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9632, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.67, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047644391655921936, "optim/lr": 2.1992795585834558e-07, "optim/total_tokens": 2004365606912, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2423537969589233, "created_at": "2025-06-03T11:13:22.928390+00:00"} {"global_step": 238940, "acc_step": 0, "speed/wps": 5523.957773947107, "speed/FLOPS": 244130659429458.66, "speed/curr_iter_time": 2.965, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.965, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.79, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04690709710121155, "optim/lr": 2.1638073076379882e-07, "optim/total_tokens": 2004373995520, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.261252760887146, "created_at": "2025-06-03T11:13:25.898744+00:00"} {"global_step": 238941, "acc_step": 0, "speed/wps": 5514.286988992651, "speed/FLOPS": 243703260234036.3, "speed/curr_iter_time": 2.9702, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9702, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 197.14, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04709754139184952, "optim/lr": 2.1283350566925208e-07, "optim/total_tokens": 2004382384128, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2630335092544556, "created_at": "2025-06-03T11:13:28.874135+00:00"} {"global_step": 238942, "acc_step": 0, "speed/wps": 5510.315747602928, "speed/FLOPS": 243527751691266.7, "speed/curr_iter_time": 2.9709, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9709, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 197.19, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.0476076565682888, "optim/lr": 2.0928628057492737e-07, "optim/total_tokens": 2004390772736, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2738827466964722, "created_at": "2025-06-03T11:13:31.854088+00:00"} {"global_step": 238943, "acc_step": 0, "speed/wps": 5530.256038667579, "speed/FLOPS": 244409010492662.28, "speed/curr_iter_time": 2.9616, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9616, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.57, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047235868871212006, "optim/lr": 2.0573905548038063e-07, "optim/total_tokens": 2004399161344, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2568132877349854, "created_at": "2025-06-03T11:13:34.820816+00:00"} {"global_step": 238944, "acc_step": 0, "speed/wps": 5525.735144525167, "speed/FLOPS": 244209210111601.6, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.74, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047192540019750595, "optim/lr": 2.021918303858339e-07, "optim/total_tokens": 2004407549952, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 382, "loss/out": 1.2539256811141968, "created_at": "2025-06-03T11:13:37.794718+00:00"} {"global_step": 238945, "acc_step": 0, "speed/wps": 5526.764956096448, "speed/FLOPS": 244254722511998.78, "speed/curr_iter_time": 2.9622, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9622, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.05 hours", "speed/est_time_elapsed_hrs": 196.61, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.05, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047490619122982025, "optim/lr": 1.9864460529128715e-07, "optim/total_tokens": 2004415938560, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.24642014503479, "created_at": "2025-06-03T11:13:40.767604+00:00"} {"global_step": 238946, "acc_step": 0, "speed/wps": 5517.146189279823, "speed/FLOPS": 243829622252015.62, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 197.04, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04898056387901306, "optim/lr": 1.9509738019696244e-07, "optim/total_tokens": 2004424327168, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.260083794593811, "created_at": "2025-06-03T11:13:43.742169+00:00"} {"global_step": 238947, "acc_step": 0, "speed/wps": 5523.51928408163, "speed/FLOPS": 244111280421799.16, "speed/curr_iter_time": 2.9652, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9652, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 196.81, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04748089611530304, "optim/lr": 1.9155015510241568e-07, "optim/total_tokens": 2004432715776, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2581464052200317, "created_at": "2025-06-03T11:13:46.712824+00:00"} {"global_step": 238948, "acc_step": 0, "speed/wps": 5525.003642819488, "speed/FLOPS": 244176881480375.72, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 196.76, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04692095145583153, "optim/lr": 1.8800293000786894e-07, "optim/total_tokens": 2004441104384, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.25492262840271, "created_at": "2025-06-03T11:13:49.688330+00:00"} {"global_step": 238949, "acc_step": 0, "speed/wps": 5519.351308300808, "speed/FLOPS": 243927077225920.84, "speed/curr_iter_time": 2.9661, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9661, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047038186341524124, "optim/lr": 1.8445570491354423e-07, "optim/total_tokens": 2004449492992, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.2591969966888428, "created_at": "2025-06-03T11:13:52.665239+00:00"} {"global_step": 238950, "acc_step": 0, "speed/wps": 5504.796325898846, "speed/FLOPS": 243283821502907.53, "speed/curr_iter_time": 2.9753, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9753, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 197.49, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047663457691669464, "optim/lr": 1.809084798189975e-07, "optim/total_tokens": 2004457881600, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2492055892944336, "created_at": "2025-06-03T11:13:55.646650+00:00"} {"global_step": 238951, "acc_step": 0, "speed/wps": 5505.178287099412, "speed/FLOPS": 243300702232917.9, "speed/curr_iter_time": 2.9751, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9751, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 197.47, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047155559062957764, "optim/lr": 1.7736125472445075e-07, "optim/total_tokens": 2004466270208, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2522104978561401, "created_at": "2025-06-03T11:13:58.628002+00:00"} {"global_step": 238952, "acc_step": 0, "speed/wps": 5519.6022192810715, "speed/FLOPS": 243938166206969.66, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04734066128730774, "optim/lr": 1.7381402962990402e-07, "optim/total_tokens": 2004474658816, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 377, "loss/out": 1.2664973735809326, "created_at": "2025-06-03T11:14:01.604477+00:00"} {"global_step": 238953, "acc_step": 0, "speed/wps": 5529.101680381094, "speed/FLOPS": 244357993764941.0, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 196.63, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04732338339090347, "optim/lr": 1.702668045355793e-07, "optim/total_tokens": 2004483047424, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 400, "loss/out": 1.264204978942871, "created_at": "2025-06-03T11:14:04.574482+00:00"} {"global_step": 238954, "acc_step": 0, "speed/wps": 5522.08316320593, "speed/FLOPS": 244047811229826.22, "speed/curr_iter_time": 2.966, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.966, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04733436927199364, "optim/lr": 1.6671957944103254e-07, "optim/total_tokens": 2004491436032, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 392, "loss/out": 1.2465356588363647, "created_at": "2025-06-03T11:14:07.546306+00:00"} {"global_step": 238955, "acc_step": 0, "speed/wps": 5514.891936267453, "speed/FLOPS": 243729995807181.75, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 197.03, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047813620418310165, "optim/lr": 1.631723543464858e-07, "optim/total_tokens": 2004499824640, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.250131607055664, "created_at": "2025-06-03T11:14:10.521301+00:00"} {"global_step": 238956, "acc_step": 0, "speed/wps": 5517.497892188138, "speed/FLOPS": 243845165720384.47, "speed/curr_iter_time": 2.9685, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9685, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 197.04, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04704991728067398, "optim/lr": 1.5962512925193906e-07, "optim/total_tokens": 2004508213248, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.2570703029632568, "created_at": "2025-06-03T11:14:13.498704+00:00"} {"global_step": 238957, "acc_step": 0, "speed/wps": 5522.74489787009, "speed/FLOPS": 244077056514917.06, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.04 hours", "speed/est_time_elapsed_hrs": 196.85, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.04, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047031089663505554, "optim/lr": 1.5607790415761435e-07, "optim/total_tokens": 2004516601856, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.2335022687911987, "created_at": "2025-06-03T11:14:16.469602+00:00"} {"global_step": 238958, "acc_step": 0, "speed/wps": 5525.530223492261, "speed/FLOPS": 244200153650828.1, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.76, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04729057103395462, "optim/lr": 1.5253067906306762e-07, "optim/total_tokens": 2004524990464, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 384, "loss/out": 1.2559924125671387, "created_at": "2025-06-03T11:14:19.439453+00:00"} {"global_step": 238959, "acc_step": 0, "speed/wps": 5513.580307328904, "speed/FLOPS": 243672028521623.4, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 197.09, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04735748842358589, "optim/lr": 1.4898345396852088e-07, "optim/total_tokens": 2004533379072, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2431992292404175, "created_at": "2025-06-03T11:14:22.418667+00:00"} {"global_step": 238960, "acc_step": 0, "speed/wps": 5528.594566947221, "speed/FLOPS": 244335581946805.66, "speed/curr_iter_time": 2.9625, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9625, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.64, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047568801790475845, "optim/lr": 1.4543622887397411e-07, "optim/total_tokens": 2004541767680, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 411, "loss/out": 1.233615517616272, "created_at": "2025-06-03T11:14:25.387504+00:00"} {"global_step": 238961, "acc_step": 0, "speed/wps": 5517.600608853574, "speed/FLOPS": 243849705271245.2, "speed/curr_iter_time": 2.9684, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9684, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 197.04, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047436557710170746, "optim/lr": 1.4188900377964943e-07, "optim/total_tokens": 2004550156288, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2501856088638306, "created_at": "2025-06-03T11:14:28.361590+00:00"} {"global_step": 238962, "acc_step": 0, "speed/wps": 5526.609656294719, "speed/FLOPS": 244247859055658.78, "speed/curr_iter_time": 2.9621, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9621, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04689837619662285, "optim/lr": 1.3834177868510267e-07, "optim/total_tokens": 2004558544896, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 396, "loss/out": 1.2528287172317505, "created_at": "2025-06-03T11:14:31.334441+00:00"} {"global_step": 238963, "acc_step": 0, "speed/wps": 5525.529990933402, "speed/FLOPS": 244200143372916.84, "speed/curr_iter_time": 2.9642, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9642, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.76, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04720982164144516, "optim/lr": 1.3479455359055593e-07, "optim/total_tokens": 2004566933504, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 385, "loss/out": 1.2574657201766968, "created_at": "2025-06-03T11:14:34.303952+00:00"} {"global_step": 238964, "acc_step": 0, "speed/wps": 5525.080463049565, "speed/FLOPS": 244180276541343.56, "speed/curr_iter_time": 2.9644, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9644, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.77, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04696043208241463, "optim/lr": 1.312473284960092e-07, "optim/total_tokens": 2004575322112, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.2571005821228027, "created_at": "2025-06-03T11:14:37.274432+00:00"} {"global_step": 238965, "acc_step": 0, "speed/wps": 5516.080143970916, "speed/FLOPS": 243782508505876.44, "speed/curr_iter_time": 2.9677, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9677, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.99, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04693766310811043, "optim/lr": 1.2770010340168448e-07, "optim/total_tokens": 2004583710720, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2462615966796875, "created_at": "2025-06-03T11:14:40.251974+00:00"} {"global_step": 238966, "acc_step": 0, "speed/wps": 5520.598044717284, "speed/FLOPS": 243982176594153.6, "speed/curr_iter_time": 2.9668, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9668, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.93, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04828658327460289, "optim/lr": 1.2415287830713774e-07, "optim/total_tokens": 2004592099328, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 364, "loss/out": 1.2563812732696533, "created_at": "2025-06-03T11:14:43.230330+00:00"} {"global_step": 238967, "acc_step": 0, "speed/wps": 5518.582010440886, "speed/FLOPS": 243893078198135.66, "speed/curr_iter_time": 2.9679, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9679, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 197.01, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04733341187238693, "optim/lr": 1.2060565321259098e-07, "optim/total_tokens": 2004600487936, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 360, "loss/out": 1.2542359828948975, "created_at": "2025-06-03T11:14:46.203901+00:00"} {"global_step": 238968, "acc_step": 0, "speed/wps": 5521.386491079101, "speed/FLOPS": 244017021887711.6, "speed/curr_iter_time": 2.9664, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9664, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.91, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04697387292981148, "optim/lr": 1.1705842811804424e-07, "optim/total_tokens": 2004608876544, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 373, "loss/out": 1.2361031770706177, "created_at": "2025-06-03T11:14:49.176301+00:00"} {"global_step": 238969, "acc_step": 0, "speed/wps": 5525.17434890755, "speed/FLOPS": 244184425815715.1, "speed/curr_iter_time": 2.9631, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9631, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.03 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.03, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04702398180961609, "optim/lr": 1.1351120302371953e-07, "optim/total_tokens": 2004617265152, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 371, "loss/out": 1.2514469623565674, "created_at": "2025-06-03T11:14:52.150641+00:00"} {"global_step": 238970, "acc_step": 0, "speed/wps": 5531.423688376896, "speed/FLOPS": 244460614633241.12, "speed/curr_iter_time": 2.961, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.961, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.55, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047308068722486496, "optim/lr": 1.0996397792917279e-07, "optim/total_tokens": 2004625653760, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 409, "loss/out": 1.248795986175537, "created_at": "2025-06-03T11:14:55.117439+00:00"} {"global_step": 238971, "acc_step": 0, "speed/wps": 5526.793031174863, "speed/FLOPS": 244255963286763.44, "speed/curr_iter_time": 2.9635, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9635, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.72, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04727980121970177, "optim/lr": 1.0641675283462604e-07, "optim/total_tokens": 2004634042368, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.250706672668457, "created_at": "2025-06-03T11:14:58.086309+00:00"} {"global_step": 238972, "acc_step": 0, "speed/wps": 5522.986529791479, "speed/FLOPS": 244087735409058.16, "speed/curr_iter_time": 2.9641, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9641, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.76, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04711980000138283, "optim/lr": 1.028695277400793e-07, "optim/total_tokens": 2004642430976, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 402, "loss/out": 1.247884750366211, "created_at": "2025-06-03T11:15:01.056747+00:00"} {"global_step": 238973, "acc_step": 0, "speed/wps": 5522.749047639024, "speed/FLOPS": 244077239913463.47, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04775025323033333, "optim/lr": 9.932230264575459e-08, "optim/total_tokens": 2004650819584, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 397, "loss/out": 1.2329895496368408, "created_at": "2025-06-03T11:15:04.031687+00:00"} {"global_step": 238974, "acc_step": 0, "speed/wps": 5522.807374354473, "speed/FLOPS": 244079817655743.12, "speed/curr_iter_time": 2.9657, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9657, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.87, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04811253398656845, "optim/lr": 9.577507755120784e-08, "optim/total_tokens": 2004659208192, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 413, "loss/out": 1.2561601400375366, "created_at": "2025-06-03T11:15:07.006729+00:00"} {"global_step": 238975, "acc_step": 0, "speed/wps": 5519.610008459942, "speed/FLOPS": 243938510448807.1, "speed/curr_iter_time": 2.9673, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9673, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.98, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04743672162294388, "optim/lr": 9.22278524566611e-08, "optim/total_tokens": 2004667596800, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 366, "loss/out": 1.2539803981781006, "created_at": "2025-06-03T11:15:09.980158+00:00"} {"global_step": 238976, "acc_step": 0, "speed/wps": 5514.375541929031, "speed/FLOPS": 243707173820569.3, "speed/curr_iter_time": 2.9687, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9687, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 197.07, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.0478028878569603, "optim/lr": 8.868062736233639e-08, "optim/total_tokens": 2004675985408, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2420083284378052, "created_at": "2025-06-03T11:15:12.956659+00:00"} {"global_step": 238977, "acc_step": 0, "speed/wps": 5531.762921926395, "speed/FLOPS": 244475607019774.25, "speed/curr_iter_time": 2.9609, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9609, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.55, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04753853753209114, "optim/lr": 8.513340226778965e-08, "optim/total_tokens": 2004684374016, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 372, "loss/out": 1.2501360177993774, "created_at": "2025-06-03T11:15:15.926590+00:00"} {"global_step": 238978, "acc_step": 0, "speed/wps": 5528.02231841123, "speed/FLOPS": 244310291490548.38, "speed/curr_iter_time": 2.9629, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9629, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.69, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047669291496276855, "optim/lr": 8.15861771732429e-08, "optim/total_tokens": 2004692762624, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2507355213165283, "created_at": "2025-06-03T11:15:18.894386+00:00"} {"global_step": 238979, "acc_step": 0, "speed/wps": 5526.123784422362, "speed/FLOPS": 244226386005818.3, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.65, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04716562107205391, "optim/lr": 7.803895207869616e-08, "optim/total_tokens": 2004701151232, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2510985136032104, "created_at": "2025-06-03T11:15:21.863409+00:00"} {"global_step": 238980, "acc_step": 0, "speed/wps": 5521.192890450292, "speed/FLOPS": 244008465730856.1, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 196.93, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04817851632833481, "optim/lr": 7.449172698437145e-08, "optim/total_tokens": 2004709539840, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.26095449924469, "created_at": "2025-06-03T11:15:24.838105+00:00"} {"global_step": 238981, "acc_step": 0, "speed/wps": 5511.217557259741, "speed/FLOPS": 243567607062217.53, "speed/curr_iter_time": 2.9719, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9719, "speed/est_time_elapsed": "8.22 days", "speed/est_time_remaining": "0.02 hours", "speed/est_time_elapsed_hrs": 197.29, "speed/est_time_elapsed_days": 8.22, "speed/est_time_remaining_hrs": 0.02, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04738273099064827, "optim/lr": 7.094450188982472e-08, "optim/total_tokens": 2004717928448, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 410, "loss/out": 1.2501871585845947, "created_at": "2025-06-03T11:15:27.818915+00:00"} {"global_step": 238982, "acc_step": 0, "speed/wps": 5514.176883208463, "speed/FLOPS": 243698394121947.72, "speed/curr_iter_time": 2.9688, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9688, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.08, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04755867272615433, "optim/lr": 6.739727679527796e-08, "optim/total_tokens": 2004726317056, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 381, "loss/out": 1.2483853101730347, "created_at": "2025-06-03T11:15:30.794307+00:00"} {"global_step": 238983, "acc_step": 0, "speed/wps": 5516.644459018001, "speed/FLOPS": 243807448342531.34, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.09, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04749106988310814, "optim/lr": 6.385005170073121e-08, "optim/total_tokens": 2004734705664, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.262050747871399, "created_at": "2025-06-03T11:15:33.768470+00:00"} {"global_step": 238984, "acc_step": 0, "speed/wps": 5505.524834180692, "speed/FLOPS": 243316017840121.72, "speed/curr_iter_time": 2.9749, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9749, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.49, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047254811972379684, "optim/lr": 6.030282660640652e-08, "optim/total_tokens": 2004743094272, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2451175451278687, "created_at": "2025-06-03T11:15:36.749707+00:00"} {"global_step": 238985, "acc_step": 0, "speed/wps": 5507.384531392832, "speed/FLOPS": 243398206938105.1, "speed/curr_iter_time": 2.974, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.974, "speed/est_time_elapsed": "8.23 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.43, "speed/est_time_elapsed_days": 8.23, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04715166985988617, "optim/lr": 5.6755601511859764e-08, "optim/total_tokens": 2004751482880, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 369, "loss/out": 1.2505347728729248, "created_at": "2025-06-03T11:15:39.729881+00:00"} {"global_step": 238986, "acc_step": 0, "speed/wps": 5527.499825973456, "speed/FLOPS": 244287199999157.5, "speed/curr_iter_time": 2.9618, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9618, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 196.62, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047378428280353546, "optim/lr": 5.320837641731302e-08, "optim/total_tokens": 2004759871488, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 383, "loss/out": 1.2662543058395386, "created_at": "2025-06-03T11:15:42.698049+00:00"} {"global_step": 238987, "acc_step": 0, "speed/wps": 5521.15537579323, "speed/FLOPS": 244006807775031.34, "speed/curr_iter_time": 2.9665, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9665, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 196.93, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04684227705001831, "optim/lr": 4.9661151322766274e-08, "optim/total_tokens": 2004768260096, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.2501455545425415, "created_at": "2025-06-03T11:15:45.674484+00:00"} {"global_step": 238988, "acc_step": 0, "speed/wps": 5514.895177407689, "speed/FLOPS": 243730139048990.5, "speed/curr_iter_time": 2.9699, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9699, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.16, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.046874769032001495, "optim/lr": 4.611392622844157e-08, "optim/total_tokens": 2004776648704, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 374, "loss/out": 1.2643296718597412, "created_at": "2025-06-03T11:15:48.649725+00:00"} {"global_step": 238989, "acc_step": 0, "speed/wps": 5514.158952091639, "speed/FLOPS": 243697601658363.88, "speed/curr_iter_time": 2.969, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.969, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.1, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047430794686079025, "optim/lr": 4.2566701133894826e-08, "optim/total_tokens": 2004785037312, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 390, "loss/out": 1.2676951885223389, "created_at": "2025-06-03T11:15:51.625302+00:00"} {"global_step": 238990, "acc_step": 0, "speed/wps": 5521.791113204232, "speed/FLOPS": 244034904114598.6, "speed/curr_iter_time": 2.9662, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9662, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 196.91, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04747329279780388, "optim/lr": 3.901947603934808e-08, "optim/total_tokens": 2004793425920, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.24844491481781, "created_at": "2025-06-03T11:15:54.600937+00:00"} {"global_step": 238991, "acc_step": 0, "speed/wps": 5518.278418144748, "speed/FLOPS": 243879660972572.6, "speed/curr_iter_time": 2.9681, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9681, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.04, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047384656965732574, "optim/lr": 3.547225094480133e-08, "optim/total_tokens": 2004801814528, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 401, "loss/out": 1.2621718645095825, "created_at": "2025-06-03T11:15:57.574193+00:00"} {"global_step": 238992, "acc_step": 0, "speed/wps": 5514.168563618961, "speed/FLOPS": 243698026438675.28, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 197.1, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04726429656147957, "optim/lr": 3.192502585047663e-08, "optim/total_tokens": 2004810203136, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 368, "loss/out": 1.2472609281539917, "created_at": "2025-06-03T11:16:00.553346+00:00"} {"global_step": 238993, "acc_step": 0, "speed/wps": 5528.965316211383, "speed/FLOPS": 244351967166614.84, "speed/curr_iter_time": 2.9623, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9623, "speed/est_time_elapsed": "8.19 days", "speed/est_time_remaining": "0.01 hours", "speed/est_time_elapsed_hrs": 196.66, "speed/est_time_elapsed_days": 8.19, "speed/est_time_remaining_hrs": 0.01, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04809693619608879, "optim/lr": 2.8377800755929882e-08, "optim/total_tokens": 2004818591744, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 370, "loss/out": 1.2512485980987549, "created_at": "2025-06-03T11:16:03.520768+00:00"} {"global_step": 238994, "acc_step": 0, "speed/wps": 5542.545152742008, "speed/FLOPS": 244952126433364.1, "speed/curr_iter_time": 2.9551, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9551, "speed/est_time_elapsed": "8.17 days", "speed/est_time_remaining": "0.0 hours", "speed/est_time_elapsed_hrs": 196.18, "speed/est_time_elapsed_days": 8.17, "speed/est_time_remaining_hrs": 0.0, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04771140217781067, "optim/lr": 2.4830575661383137e-08, "optim/total_tokens": 2004826980352, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 408, "loss/out": 1.2492941617965698, "created_at": "2025-06-03T11:16:06.483925+00:00"} {"global_step": 238995, "acc_step": 0, "speed/wps": 5519.894082810743, "speed/FLOPS": 243951065081088.2, "speed/curr_iter_time": 2.9672, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9672, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.0 hours", "speed/est_time_elapsed_hrs": 196.98, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.0, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04681655764579773, "optim/lr": 2.128335056683639e-08, "optim/total_tokens": 2004835368960, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 406, "loss/out": 1.2442083358764648, "created_at": "2025-06-03T11:16:09.456742+00:00"} {"global_step": 238996, "acc_step": 0, "speed/wps": 5523.114081362786, "speed/FLOPS": 244093372535641.8, "speed/curr_iter_time": 2.964, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.964, "speed/est_time_elapsed": "8.2 days", "speed/est_time_remaining": "0.0 hours", "speed/est_time_elapsed_hrs": 196.77, "speed/est_time_elapsed_days": 8.2, "speed/est_time_remaining_hrs": 0.0, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047301530838012695, "optim/lr": 1.773612547251169e-08, "optim/total_tokens": 2004843757568, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 367, "loss/out": 1.2516924142837524, "created_at": "2025-06-03T11:16:12.428939+00:00"} {"global_step": 238997, "acc_step": 0, "speed/wps": 5516.04502199161, "speed/FLOPS": 243780956294161.72, "speed/curr_iter_time": 2.9693, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9693, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.0 hours", "speed/est_time_elapsed_hrs": 197.13, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.0, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04789962247014046, "optim/lr": 1.4188900377964941e-08, "optim/total_tokens": 2004852146176, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 363, "loss/out": 1.254172682762146, "created_at": "2025-06-03T11:16:15.403431+00:00"} {"global_step": 238998, "acc_step": 0, "speed/wps": 5516.204646465704, "speed/FLOPS": 243788010878884.56, "speed/curr_iter_time": 2.9692, "speed/data_load_time": 0.0006, "speed/curr_step_time": 2.9692, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.0 hours", "speed/est_time_elapsed_hrs": 197.12, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.0, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04755503311753273, "optim/lr": 1.0641675283418194e-08, "optim/total_tokens": 2004860534784, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 398, "loss/out": 1.25467050075531, "created_at": "2025-06-03T11:16:18.381851+00:00"} {"global_step": 238999, "acc_step": 0, "speed/wps": 5516.176897657886, "speed/FLOPS": 243786784523610.28, "speed/curr_iter_time": 2.968, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.968, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.0 hours", "speed/est_time_elapsed_hrs": 197.04, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.0, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.04682234302163124, "optim/lr": 7.094450188871449e-09, "optim/total_tokens": 2004868923392, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 403, "loss/out": 1.2360833883285522, "created_at": "2025-06-03T11:16:21.355892+00:00"} {"global_step": 239000, "acc_step": 0, "speed/wps": 5516.655435487414, "speed/FLOPS": 243807933446296.75, "speed/curr_iter_time": 2.9689, "speed/data_load_time": 0.0007, "speed/curr_step_time": 2.9689, "speed/est_time_elapsed": "8.21 days", "speed/est_time_remaining": "0.0 hours", "speed/est_time_elapsed_hrs": 197.1, "speed/est_time_elapsed_days": 8.21, "speed/est_time_remaining_hrs": 0.0, "speed/est_time_remaining_days": 0.0, "optim/grad_norm": 0.047519881278276443, "optim/lr": 3.5472250945467465e-09, "optim/total_tokens": 2004877312000, "memory/max_active_gib": 82.03078985214233, "memory/max_active_pct": 64.0865545719862, "memory/max_reserved_gib": 85.4765625, "memory/max_reserved_pct": 66.778564453125, "memory/num_alloc_retries": 0, "memory/num_ooms": 0, "memory/power_draw": 388, "loss/out": 1.26225745677948, "created_at": "2025-06-03T11:16:24.332519+00:00"}